{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "fdf791e6",
   "metadata": {},
   "outputs": [],
   "source": [
    "用户输入的地区 = input"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "ebb68a24",
   "metadata": {},
   "outputs": [],
   "source": [
    "import requests\n",
    "import json\n",
    "\n",
    "url = \"https://api-c.liepin.com/api/com.liepin.searchfront4c.pc-search-job\"\n",
    "payload = {\n",
    "    \"data\": {\n",
    "        \"mainSearchPcConditionForm\": {\n",
    "            \"city\": \"用户输入的地区\",\n",
    "            \"pubTime\": \"\",\n",
    "            \"currentPage\": 0,\n",
    "            \"pageSize\": 40,\n",
    "            \"key\": \"用户输入的岗位\",\n",
    "            \"suggestTag\": \"\",\n",
    "            \"workYearCode\": \"0\",\n",
    "            \"compId\": \"\",\n",
    "            \"compName\": \"\",\n",
    "            \"compTag\": \"\",\n",
    "            \"industry\": \"\",\n",
    "            \"salary\": \"\",\n",
    "            \"jobKind\": \"\",\n",
    "            \"compScale\": \"\",\n",
    "            \"compKind\": \"\",\n",
    "            \"compStage\": \"\",\n",
    "            \"eduLevel\": \"\"\n",
    "        },\n",
    "        \"passThroughForm\": {\n",
    "            \"scene\": \"input\",\n",
    "            \"skId\": \"\",\n",
    "            \"fkId\": \"\",\n",
    "            \"ckId\": \"h2c8pxojavrmo1w785z7ueih2ybfpux8\",\n",
    "            \"suggest\": None\n",
    "        }\n",
    "    }\n",
    "}\n",
    "\n",
    "\n",
    "\n",
    "# set the headers\n",
    "headers = {\n",
    "    'Accept':'application/json, text/plain, */*',\n",
    "    'Accept-Encoding':'gzip, deflate, br',\n",
    "    'Accept-Language':'zh-CN,zh;q=0.9',\n",
    "    'Connection':'keep-alive',\n",
    "    'Content-Len,gth':'481',\n",
    "    'Content-Type':'application/json;charset=UTF-8;',\n",
    "    'Cookie':'inited_user=1dd9ec13c450e889bbbdf0c59550b6b7; __gc_id=5d33306e72ce4b0186c45865e0922810; __uuid=1679039529657.44; _ga=GA1.1.434120596.1681917222; need_bind_tel=false; new_user=false; c_flag=e25d5905dfe4d5bf9737a08ef6961e7c; imClientId=69a80dbfb86321fde4e79498d74426d3; imId=69a80dbfb86321fd0db887e0f6b8d42d; imClientId_0=69a80dbfb86321fde4e79498d74426d3; imId_0=69a80dbfb86321fd0db887e0f6b8d42d; XSRF-TOKEN=dQmzmiAWSqiDPe788r3rxg; user_roles=0; user_photo=5f8fa3bddfb13a7dee343d7608u.png; user_name=%E6%9D%8E%E9%93%B8%E6%B3%A2; inited_user=1dd9ec13c450e889bbbdf0c59550b6b7; imApp_0=1; __tlog=1683874528420.02%7C00000000%7C00000000%7Cs_o_001%7CFavsk7rH; b-u-category=1; Hm_lvt_a2647413544f5a04f00da7eee0d5e200=1683874529; acw_tc=276082a916842141050373388e314a217632dffcffa3c563e46a28be2f0f58; UniqueKey=81b18052d529ff237ecd4408bb1e9b04; liepin_login_valid=0; lt_auth=vexYbnwFnA2r5HaLjDEM568Z2durVjrO%2FS4L1BEE19LvD6Ww4P%2FmQQ6Aq7cD%2FCoIqxtxfvwzMLb2Mer%2FzXJP70sW%2F1GnlZ6utf6k1X4eTuZtHuyflMXuqsjQQ5wtrXo6ykpgn2si0HU%3D; access_system=C; Hm_lpvt_a2647413544f5a04f00da7eee0d5e200=1684214174; fe_im_connectJson_0=%7B%220_81b18052d529ff237ecd4408bb1e9b04%22%3A%7B%22socketConnect%22%3A%221%22%2C%22connectDomain%22%3A%22liepin.com%22%7D%7D; fe_im_socketSequence_new_0=9_9_6; __session_seq=19; __uv_seq=5; _ga_54YTJKWN86=GS1.1.1684214104.5.1.1684214229.0.0.0; fe_im_opened_pages=_1683876536782',\n",
    "    'Host':'api-c.liepin.com',\n",
    "    'Origin':'https://www.liepin.com',\n",
    "    'Referer':'https://www.liepin.com/',\n",
    "    'Sec-Ch-Ua':'\"Google Chrome\";v=\"113\", \"Chromium\";v=\"113\", \"Not-A.Brand\";v=\"24\"',\n",
    "    'Sec-Ch-Ua-Mobile':'?0',\n",
    "    'Sec-Ch-Ua-Platform':'\"Windows\"',\n",
    "    'Sec-Fetch-Dest':'empty',\n",
    "    'Sec-Fetch-Mode':'cors',\n",
    "    'Sec-Fetch-Site':'same-site',\n",
    "    'User-Agent':'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/113.0.0.0 Safari/537.36',\n",
    "    'X-Client-Type':'web',\n",
    "    'X-Fscp-Bi-Stat':'{\"location\": \"https://www.liepin.com/zhaopin/?city=410&dq=410&pubTime=&currentPage=0&pageSize=40&key=%E6%96%B0%E5%AA%92%E4%BD%93%E8%BF%90%E8%90%A5&suggestTag=&workYearCode=1&compId=&compName=&compTag=&industry=&salary=&jobKind=&compScale=&compKind=&compStage=&eduLevel=&otherCity=&ckId=m115ee66gzyoe0871yajsc5ijixjuoc8&scene=input&skId=m115ee66gzyoe0871yajsc5ijixjuoc8&fkId=m115ee66gzyoe0871yajsc5ijixjuoc8&sfrom=search_job_pc&suggestId=\"}',\n",
    "    'X-Fscp-Fe-Version': '',\n",
    "    'X-Fscp-Std-Info': '{\"client_id\": \"40108\"}',\n",
    "    'X-Fscp-Trace-Id':'32822db8-83c1-461f-bd0a-9f83c35b2b4c',\n",
    "    'X-Fscp-Version': '1.1',\n",
    "    'X-Requested-With': 'XMLHttpRequest',\n",
    "    'X-XSRF-TOKEN': 'dQmzmiAWSqiDPe788r3rxg'\n",
    "}\n",
    "\n",
    "# send a POST request with headers\n",
    "r = requests.post(url, data=json.dumps(payload), headers=headers)\n",
    "\n",
    "# extract the JSON data from the response\n",
    "response_data = r.json()\n",
    "\n",
    "# example: print the number of job postings returned\n",
    "print(response_data)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 1,
   "id": "c155abc0",
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 168,
   "id": "290e827b",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>dataInfo</th>\n",
       "      <th>dataParams</th>\n",
       "      <th>comp.compIndustry</th>\n",
       "      <th>comp.compId</th>\n",
       "      <th>comp.compLogo</th>\n",
       "      <th>comp.compName</th>\n",
       "      <th>comp.link</th>\n",
       "      <th>comp.compScale</th>\n",
       "      <th>recruiter.imId</th>\n",
       "      <th>...</th>\n",
       "      <th>job.topJob</th>\n",
       "      <th>job.title</th>\n",
       "      <th>job.pcOuterLink</th>\n",
       "      <th>job.h5OuterLink</th>\n",
       "      <th>job.link</th>\n",
       "      <th>job.campusJobKind</th>\n",
       "      <th>job.dataPromId</th>\n",
       "      <th>comp.compStage</th>\n",
       "      <th>job.requireWorkYears</th>\n",
       "      <th>job.requireEduLevel</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"d4220742abc67c8c66070057dda5d09e\",\"...</td>\n",
       "      <td>批发/零售</td>\n",
       "      <td>12587363.0</td>\n",
       "      <td>603b342d5acef567b702eac007u.jpg</td>\n",
       "      <td>广州市拓植文化传播有限公司</td>\n",
       "      <td>https://www.liepin.com/company/12587363/</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>8c27dae32e9b17a9ac365a663ca833da</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://www.liepin.com/lptjob/36944041</td>\n",
       "      <td>应届</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=0&amp;d...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"da8cc60122dd16261d76b074084784e4\",\"...</td>\n",
       "      <td>家政服务</td>\n",
       "      <td>12565395.0</td>\n",
       "      <td>612d9c1b3d9300348516339803u.jpg</td>\n",
       "      <td>慢会所</td>\n",
       "      <td>https://www.liepin.com/company/12565395/</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>3f635980fd134cdacb203885796dc433</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://www.liepin.com/lptjob/42741455</td>\n",
       "      <td>应届</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=0&amp;d...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"831c925dea3fb8a6090b6ac457f5ea52\",\"...</td>\n",
       "      <td>互联网</td>\n",
       "      <td>8476411.0</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>广州市学晟惠信息科技有限公司</td>\n",
       "      <td>https://www.liepin.com/company/8476411/</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>fdd08052cb5eb4b3448d0695f9e5436a</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://www.liepin.com/lptjob/58332313</td>\n",
       "      <td>应届</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=0&amp;d...</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"d7e40bf2c6c9f9cc1ace31e5dccd07e9\",\"...</td>\n",
       "      <td>其他商务服务业</td>\n",
       "      <td>13513523.0</td>\n",
       "      <td>61b07937d0458d53c627567e02u.jpg</td>\n",
       "      <td>广州花林知行研学旅行服务有限公司</td>\n",
       "      <td>https://www.liepin.com/company/13513523/</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>315f2e2357f8b2a9cd120ce14494f73d</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://www.liepin.com/lptjob/57929205</td>\n",
       "      <td>应届</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=0&amp;d...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>%7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...</td>\n",
       "      <td>{\"userId\":\"e9ae0c6d35b77d020104d2aba3164681\",\"...</td>\n",
       "      <td>生活服务O2O</td>\n",
       "      <td>8854855.0</td>\n",
       "      <td>59bb74a770328eecdbaf843704a.png</td>\n",
       "      <td>蜂助手股份有限公司</td>\n",
       "      <td>https://www.liepin.com/company/8854855/</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>f9981e992d8231169f90a7bcfdb96d0e</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>新媒体运营（应届生或实习生）</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://www.liepin.com/lptjob/56775649</td>\n",
       "      <td>应届</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=0&amp;d...</td>\n",
       "      <td>融资未公开</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>35</td>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"李女士\",\"userId\":\"113f650d99b2f...</td>\n",
       "      <td>日化</td>\n",
       "      <td>1998001.0</td>\n",
       "      <td>5c6a4ab5509919c4f5f533a302u.png</td>\n",
       "      <td>立白集团</td>\n",
       "      <td>https://www.liepin.com/company/1998001/</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>f0f95114bc85316bbefa578784e31c32</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>新媒体运营（有丛气）</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://www.liepin.com/job/1956588071.shtml</td>\n",
       "      <td>NaN</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=19&amp;...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>大专</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>36</td>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"董女士\",\"userId\":\"a6bdeb2e6f03d...</td>\n",
       "      <td>房地产开发经营</td>\n",
       "      <td>NaN</td>\n",
       "      <td>60e2fe0bf3df194a3c48adb502u.png</td>\n",
       "      <td>某知名公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>d145a0c18f71c2b0063dfc1b00f6daab</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>新媒体运营专员</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://www.liepin.com/a/45719301.shtml</td>\n",
       "      <td>NaN</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=19&amp;...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>大专及以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>37</td>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"宋女士\",\"userId\":\"9f229bd577e8d...</td>\n",
       "      <td>货运/物流/仓储</td>\n",
       "      <td>NaN</td>\n",
       "      <td>60e2fe0bf3df194a3c48adb502u.png</td>\n",
       "      <td>某广州大型货运/物流/仓储公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>9e6539b6024d733f9f90a7bcfdb96d0e</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>新媒体运营岗</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://www.liepin.com/a/45725809.shtml</td>\n",
       "      <td>NaN</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=19&amp;...</td>\n",
       "      <td>已上市</td>\n",
       "      <td>3-5年</td>\n",
       "      <td>统招本科</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>38</td>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"唐女士\",\"userId\":\"cab5da268eb2e...</td>\n",
       "      <td>智能硬件</td>\n",
       "      <td>NaN</td>\n",
       "      <td>60e2fe0bf3df194a3c48adb502u.png</td>\n",
       "      <td>某国内智能硬件公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>b2e04f81dcc7c0be5ad960e36627eac9</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://www.liepin.com/a/45439065.shtml</td>\n",
       "      <td>NaN</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=19&amp;...</td>\n",
       "      <td>A轮</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>统招本科</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>39</td>\n",
       "      <td>%7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...</td>\n",
       "      <td>{\"recruiterName\":\"余先生\",\"userId\":\"9596dfe683c47...</td>\n",
       "      <td>计算机软件</td>\n",
       "      <td>NaN</td>\n",
       "      <td>60e2fe0bf3df194a3c48adb502u.png</td>\n",
       "      <td>某广州计算机软件公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>3df7086d47038591c6ad1568e455f51a</td>\n",
       "      <td>...</td>\n",
       "      <td>False</td>\n",
       "      <td>新媒体运营（公众号、Facebook、titok）</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>https://www.liepin.com/a/45449227.shtml</td>\n",
       "      <td>NaN</td>\n",
       "      <td>d_sfrom=search_prime&amp;d_ckId=null&amp;d_curPage=19&amp;...</td>\n",
       "      <td>不需要融资</td>\n",
       "      <td>1-3年</td>\n",
       "      <td>本科及以上</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 33 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0                                           dataInfo  \\\n",
       "0             0  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "1             1  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "2             2  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "3             3  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "4             4  %7B%22ckId%22%3A%22h2c8pxojavrmo1w785z7ueih2yb...   \n",
       "..          ...                                                ...   \n",
       "795          35  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "796          36  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "797          37  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "798          38  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "799          39  %7B%22sfrom%22%3A%22search_job_pc%22%2C%22jobK...   \n",
       "\n",
       "                                            dataParams comp.compIndustry  \\\n",
       "0    {\"userId\":\"d4220742abc67c8c66070057dda5d09e\",\"...             批发/零售   \n",
       "1    {\"userId\":\"da8cc60122dd16261d76b074084784e4\",\"...              家政服务   \n",
       "2    {\"userId\":\"831c925dea3fb8a6090b6ac457f5ea52\",\"...               互联网   \n",
       "3    {\"userId\":\"d7e40bf2c6c9f9cc1ace31e5dccd07e9\",\"...           其他商务服务业   \n",
       "4    {\"userId\":\"e9ae0c6d35b77d020104d2aba3164681\",\"...           生活服务O2O   \n",
       "..                                                 ...               ...   \n",
       "795  {\"recruiterName\":\"李女士\",\"userId\":\"113f650d99b2f...                日化   \n",
       "796  {\"recruiterName\":\"董女士\",\"userId\":\"a6bdeb2e6f03d...           房地产开发经营   \n",
       "797  {\"recruiterName\":\"宋女士\",\"userId\":\"9f229bd577e8d...          货运/物流/仓储   \n",
       "798  {\"recruiterName\":\"唐女士\",\"userId\":\"cab5da268eb2e...              智能硬件   \n",
       "799  {\"recruiterName\":\"余先生\",\"userId\":\"9596dfe683c47...             计算机软件   \n",
       "\n",
       "     comp.compId                    comp.compLogo     comp.compName  \\\n",
       "0     12587363.0  603b342d5acef567b702eac007u.jpg     广州市拓植文化传播有限公司   \n",
       "1     12565395.0  612d9c1b3d9300348516339803u.jpg               慢会所   \n",
       "2      8476411.0  61b07937d0458d53c627567e02u.jpg    广州市学晟惠信息科技有限公司   \n",
       "3     13513523.0  61b07937d0458d53c627567e02u.jpg  广州花林知行研学旅行服务有限公司   \n",
       "4      8854855.0  59bb74a770328eecdbaf843704a.png         蜂助手股份有限公司   \n",
       "..           ...                              ...               ...   \n",
       "795    1998001.0  5c6a4ab5509919c4f5f533a302u.png              立白集团   \n",
       "796          NaN  60e2fe0bf3df194a3c48adb502u.png             某知名公司   \n",
       "797          NaN  60e2fe0bf3df194a3c48adb502u.png   某广州大型货运/物流/仓储公司   \n",
       "798          NaN  60e2fe0bf3df194a3c48adb502u.png         某国内智能硬件公司   \n",
       "799          NaN  60e2fe0bf3df194a3c48adb502u.png        某广州计算机软件公司   \n",
       "\n",
       "                                    comp.link comp.compScale  \\\n",
       "0    https://www.liepin.com/company/12587363/          1-49人   \n",
       "1    https://www.liepin.com/company/12565395/          1-49人   \n",
       "2     https://www.liepin.com/company/8476411/          1-49人   \n",
       "3    https://www.liepin.com/company/13513523/          1-49人   \n",
       "4     https://www.liepin.com/company/8854855/       100-499人   \n",
       "..                                        ...            ...   \n",
       "795   https://www.liepin.com/company/1998001/       10000人以上   \n",
       "796                                       NaN            NaN   \n",
       "797                                       NaN       10000人以上   \n",
       "798                                       NaN         50-99人   \n",
       "799                                       NaN       100-499人   \n",
       "\n",
       "                       recruiter.imId  ...  job.topJob  \\\n",
       "0    8c27dae32e9b17a9ac365a663ca833da  ...       False   \n",
       "1    3f635980fd134cdacb203885796dc433  ...       False   \n",
       "2    fdd08052cb5eb4b3448d0695f9e5436a  ...       False   \n",
       "3    315f2e2357f8b2a9cd120ce14494f73d  ...       False   \n",
       "4    f9981e992d8231169f90a7bcfdb96d0e  ...       False   \n",
       "..                                ...  ...         ...   \n",
       "795  f0f95114bc85316bbefa578784e31c32  ...       False   \n",
       "796  d145a0c18f71c2b0063dfc1b00f6daab  ...       False   \n",
       "797  9e6539b6024d733f9f90a7bcfdb96d0e  ...       False   \n",
       "798  b2e04f81dcc7c0be5ad960e36627eac9  ...       False   \n",
       "799  3df7086d47038591c6ad1568e455f51a  ...       False   \n",
       "\n",
       "                     job.title job.pcOuterLink  job.h5OuterLink  \\\n",
       "0                     新媒体运营实习生             NaN              NaN   \n",
       "1                     新媒体运营实习生             NaN              NaN   \n",
       "2                     新媒体运营实习生             NaN              NaN   \n",
       "3                        新媒体运营             NaN              NaN   \n",
       "4               新媒体运营（应届生或实习生）             NaN              NaN   \n",
       "..                         ...             ...              ...   \n",
       "795                 新媒体运营（有丛气）             NaN              NaN   \n",
       "796                    新媒体运营专员             NaN              NaN   \n",
       "797                     新媒体运营岗             NaN              NaN   \n",
       "798                      新媒体运营             NaN              NaN   \n",
       "799  新媒体运营（公众号、Facebook、titok）             NaN              NaN   \n",
       "\n",
       "                                        job.link job.campusJobKind  \\\n",
       "0         https://www.liepin.com/lptjob/36944041                应届   \n",
       "1         https://www.liepin.com/lptjob/42741455                应届   \n",
       "2         https://www.liepin.com/lptjob/58332313                应届   \n",
       "3         https://www.liepin.com/lptjob/57929205                应届   \n",
       "4         https://www.liepin.com/lptjob/56775649                应届   \n",
       "..                                           ...               ...   \n",
       "795  https://www.liepin.com/job/1956588071.shtml               NaN   \n",
       "796      https://www.liepin.com/a/45719301.shtml               NaN   \n",
       "797      https://www.liepin.com/a/45725809.shtml               NaN   \n",
       "798      https://www.liepin.com/a/45439065.shtml               NaN   \n",
       "799      https://www.liepin.com/a/45449227.shtml               NaN   \n",
       "\n",
       "                                        job.dataPromId comp.compStage  \\\n",
       "0    d_sfrom=search_prime&d_ckId=null&d_curPage=0&d...            NaN   \n",
       "1    d_sfrom=search_prime&d_ckId=null&d_curPage=0&d...            NaN   \n",
       "2    d_sfrom=search_prime&d_ckId=null&d_curPage=0&d...          融资未公开   \n",
       "3    d_sfrom=search_prime&d_ckId=null&d_curPage=0&d...            NaN   \n",
       "4    d_sfrom=search_prime&d_ckId=null&d_curPage=0&d...          融资未公开   \n",
       "..                                                 ...            ...   \n",
       "795  d_sfrom=search_prime&d_ckId=null&d_curPage=19&...            NaN   \n",
       "796  d_sfrom=search_prime&d_ckId=null&d_curPage=19&...            NaN   \n",
       "797  d_sfrom=search_prime&d_ckId=null&d_curPage=19&...            已上市   \n",
       "798  d_sfrom=search_prime&d_ckId=null&d_curPage=19&...             A轮   \n",
       "799  d_sfrom=search_prime&d_ckId=null&d_curPage=19&...          不需要融资   \n",
       "\n",
       "    job.requireWorkYears  job.requireEduLevel  \n",
       "0                    NaN                  NaN  \n",
       "1                    NaN                  NaN  \n",
       "2                    NaN                  NaN  \n",
       "3                    NaN                  NaN  \n",
       "4                    NaN                  NaN  \n",
       "..                   ...                  ...  \n",
       "795                 1-3年                   大专  \n",
       "796                 1-3年                大专及以上  \n",
       "797                 3-5年                 统招本科  \n",
       "798                 1-3年                 统招本科  \n",
       "799                 1-3年                本科及以上  \n",
       "\n",
       "[800 rows x 33 columns]"
      ]
     },
     "execution_count": 168,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Load the Liepin spreadsheet into a DataFrame and show it as the cell result.\n",
    "liepin_xlsx_path = '../week12/liepin_PM_0516.xlsx'\n",
    "df = pd.read_excel(liepin_xlsx_path)\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 169,
   "id": "d9eeb5c3",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>job.title</th>\n",
       "      <th>job.salary</th>\n",
       "      <th>job.dq</th>\n",
       "      <th>comp.compName</th>\n",
       "      <th>comp.compScale</th>\n",
       "      <th>job.labels</th>\n",
       "      <th>job.requireEduLevel</th>\n",
       "      <th>comp.compIndustry</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>3-5k</td>\n",
       "      <td>广州</td>\n",
       "      <td>广州市拓植文化传播有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>批发/零售</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>4-7k</td>\n",
       "      <td>广州</td>\n",
       "      <td>慢会所</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '新媒体运营']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>家政服务</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>5-8k</td>\n",
       "      <td>广州-番禺区</td>\n",
       "      <td>广州市学晟惠信息科技有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>互联网</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>2-4k</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>广州花林知行研学旅行服务有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>其他商务服务业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>新媒体运营（应届生或实习生）</td>\n",
       "      <td>7-10k</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>蜂助手股份有限公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['本科']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>生活服务O2O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>新媒体运营（有丛气）</td>\n",
       "      <td>9-15k·13薪</td>\n",
       "      <td>广州-荔湾区</td>\n",
       "      <td>立白集团</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']</td>\n",
       "      <td>大专</td>\n",
       "      <td>日化</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>新媒体运营专员</td>\n",
       "      <td>8-13k·13薪</td>\n",
       "      <td>广州</td>\n",
       "      <td>某知名公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>房地产开发经营</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>新媒体运营岗</td>\n",
       "      <td>20-35k</td>\n",
       "      <td>广州-白云区</td>\n",
       "      <td>某广州大型货运/物流/仓储公司</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>货运/物流/仓储</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>15-23k·14薪</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>某国内智能硬件公司</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>['新媒体运营', '活动运营', '线上运营', '抖音平台']</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>智能硬件</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>新媒体运营（公众号、Facebook、titok）</td>\n",
       "      <td>10-15k</td>\n",
       "      <td>广州</td>\n",
       "      <td>某广州计算机软件公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>计算机软件</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                     job.title  job.salary  job.dq     comp.compName  \\\n",
       "0                     新媒体运营实习生        3-5k      广州     广州市拓植文化传播有限公司   \n",
       "1                     新媒体运营实习生        4-7k      广州               慢会所   \n",
       "2                     新媒体运营实习生        5-8k  广州-番禺区    广州市学晟惠信息科技有限公司   \n",
       "3                        新媒体运营        2-4k  广州-海珠区  广州花林知行研学旅行服务有限公司   \n",
       "4               新媒体运营（应届生或实习生）       7-10k  广州-天河区         蜂助手股份有限公司   \n",
       "..                         ...         ...     ...               ...   \n",
       "795                 新媒体运营（有丛气）   9-15k·13薪  广州-荔湾区              立白集团   \n",
       "796                    新媒体运营专员   8-13k·13薪      广州             某知名公司   \n",
       "797                     新媒体运营岗      20-35k  广州-白云区   某广州大型货运/物流/仓储公司   \n",
       "798                      新媒体运营  15-23k·14薪  广州-海珠区         某国内智能硬件公司   \n",
       "799  新媒体运营（公众号、Facebook、titok）      10-15k      广州        某广州计算机软件公司   \n",
       "\n",
       "    comp.compScale                                         job.labels  \\\n",
       "0            1-49人  ['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...   \n",
       "1            1-49人                                    ['本科', '新媒体运营']   \n",
       "2            1-49人  ['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...   \n",
       "3            1-49人                                             ['大专']   \n",
       "4         100-499人                                             ['本科']   \n",
       "..             ...                                                ...   \n",
       "795       10000人以上                ['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']   \n",
       "796            NaN  ['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...   \n",
       "797       10000人以上  ['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...   \n",
       "798         50-99人                  ['新媒体运营', '活动运营', '线上运营', '抖音平台']   \n",
       "799       100-499人     ['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']   \n",
       "\n",
       "    job.requireEduLevel comp.compIndustry  \n",
       "0                   NaN             批发/零售  \n",
       "1                   NaN              家政服务  \n",
       "2                   NaN               互联网  \n",
       "3                   NaN           其他商务服务业  \n",
       "4                   NaN           生活服务O2O  \n",
       "..                  ...               ...  \n",
       "795                  大专                日化  \n",
       "796               大专及以上           房地产开发经营  \n",
       "797                统招本科          货运/物流/仓储  \n",
       "798                统招本科              智能硬件  \n",
       "799               本科及以上             计算机软件  \n",
       "\n",
       "[800 rows x 8 columns]"
      ]
     },
     "execution_count": 169,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_sx=  df[['job.title','job.salary','job.dq','comp.compName','comp.compScale','job.labels','job.requireEduLevel','comp.compIndustry']]\n",
    "df_PM_sx"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "id": "f9fbec5c",
   "metadata": {},
   "outputs": [],
   "source": [
    "# 分组运算"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "id": "a6d611fd",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "本科       265\n",
       "大专       259\n",
       "学历不限      89\n",
       "统招本科      47\n",
       "中专/中技     21\n",
       "大专及以上      5\n",
       "硕士         4\n",
       "本科及以上      4\n",
       "初中         1\n",
       "Name: job.requireEduLevel, dtype: int64"
      ]
     },
     "execution_count": 11,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_sx['job.requireEduLevel'].value_counts()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "id": "9f2d8b74",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>comp.compName</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>job.requireEduLevel</th>\n",
       "      <th>comp.compScale</th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">中专/中技</th>\n",
       "      <th>1-49人</th>\n",
       "      <td>13</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>100-499人</th>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>初中</th>\n",
       "      <th>500-999人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"8\" valign=\"top\">大专</th>\n",
       "      <th>1-49人</th>\n",
       "      <td>109</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>100-499人</th>\n",
       "      <td>46</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1000-2000人</th>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10000人以上</th>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2000-5000人</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>54</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>500-999人</th>\n",
       "      <td>17</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5000-10000人</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">大专及以上</th>\n",
       "      <th>500-999人</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5000-10000人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">学历不限</th>\n",
       "      <th>1-49人</th>\n",
       "      <td>38</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>100-499人</th>\n",
       "      <td>13</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2000-5000人</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>26</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>500-999人</th>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5000-10000人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"8\" valign=\"top\">本科</th>\n",
       "      <th>1-49人</th>\n",
       "      <td>99</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>100-499人</th>\n",
       "      <td>43</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1000-2000人</th>\n",
       "      <td>14</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10000人以上</th>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2000-5000人</th>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>52</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>500-999人</th>\n",
       "      <td>14</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5000-10000人</th>\n",
       "      <td>10</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">本科及以上</th>\n",
       "      <th>100-499人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5000-10000人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">硕士</th>\n",
       "      <th>1-49人</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2000-5000人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"8\" valign=\"top\">统招本科</th>\n",
       "      <th>1-49人</th>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>100-499人</th>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1000-2000人</th>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10000人以上</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2000-5000人</th>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>500-999人</th>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5000-10000人</th>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                    comp.compName\n",
       "job.requireEduLevel comp.compScale               \n",
       "中专/中技               1-49人                      13\n",
       "                    100-499人                    5\n",
       "                    50-99人                      2\n",
       "初中                  500-999人                    1\n",
       "大专                  1-49人                     109\n",
       "                    100-499人                   46\n",
       "                    1000-2000人                  8\n",
       "                    10000人以上                    6\n",
       "                    2000-5000人                  2\n",
       "                    50-99人                     54\n",
       "                    500-999人                   17\n",
       "                    5000-10000人                 2\n",
       "大专及以上               500-999人                    2\n",
       "                    5000-10000人                 1\n",
       "学历不限                1-49人                      38\n",
       "                    100-499人                   13\n",
       "                    2000-5000人                  2\n",
       "                    50-99人                     26\n",
       "                    500-999人                    4\n",
       "                    5000-10000人                 1\n",
       "本科                  1-49人                      99\n",
       "                    100-499人                   43\n",
       "                    1000-2000人                 14\n",
       "                    10000人以上                    8\n",
       "                    2000-5000人                  8\n",
       "                    50-99人                     52\n",
       "                    500-999人                   14\n",
       "                    5000-10000人                10\n",
       "本科及以上               100-499人                    1\n",
       "                    50-99人                      1\n",
       "                    5000-10000人                 1\n",
       "硕士                  1-49人                       2\n",
       "                    2000-5000人                  1\n",
       "                    50-99人                      1\n",
       "统招本科                1-49人                       6\n",
       "                    100-499人                    8\n",
       "                    1000-2000人                  4\n",
       "                    10000人以上                    2\n",
       "                    2000-5000人                  6\n",
       "                    50-99人                      7\n",
       "                    500-999人                    6\n",
       "                    5000-10000人                 5"
      ]
     },
     "execution_count": 12,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_sx.groupby(['job.requireEduLevel','comp.compScale']).agg({'comp.compName':'count'})"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "4ff83090",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "id": "ef5472df",
   "metadata": {
    "scrolled": false
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th></th>\n",
       "      <th>comp.compName</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>job.requireEduLevel</th>\n",
       "      <th>comp.compScale</th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">中专/中技</th>\n",
       "      <th>1-49人</th>\n",
       "      <td>13</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>100-499人</th>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>初中</th>\n",
       "      <th>500-999人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"8\" valign=\"top\">大专</th>\n",
       "      <th>1-49人</th>\n",
       "      <td>109</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>100-499人</th>\n",
       "      <td>46</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1000-2000人</th>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10000人以上</th>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2000-5000人</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>54</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>500-999人</th>\n",
       "      <td>17</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5000-10000人</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"2\" valign=\"top\">大专及以上</th>\n",
       "      <th>500-999人</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5000-10000人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"6\" valign=\"top\">学历不限</th>\n",
       "      <th>1-49人</th>\n",
       "      <td>38</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>100-499人</th>\n",
       "      <td>13</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2000-5000人</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>26</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>500-999人</th>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5000-10000人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"8\" valign=\"top\">本科</th>\n",
       "      <th>1-49人</th>\n",
       "      <td>99</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>100-499人</th>\n",
       "      <td>43</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1000-2000人</th>\n",
       "      <td>14</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10000人以上</th>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2000-5000人</th>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>52</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>500-999人</th>\n",
       "      <td>14</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5000-10000人</th>\n",
       "      <td>10</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">本科及以上</th>\n",
       "      <th>100-499人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5000-10000人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"3\" valign=\"top\">硕士</th>\n",
       "      <th>1-49人</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2000-5000人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>1</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th rowspan=\"8\" valign=\"top\">统招本科</th>\n",
       "      <th>1-49人</th>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>100-499人</th>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1000-2000人</th>\n",
       "      <td>4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10000人以上</th>\n",
       "      <td>2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2000-5000人</th>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50-99人</th>\n",
       "      <td>7</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>500-999人</th>\n",
       "      <td>6</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5000-10000人</th>\n",
       "      <td>5</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                    comp.compName\n",
       "job.requireEduLevel comp.compScale               \n",
       "中专/中技               1-49人                      13\n",
       "                    100-499人                    5\n",
       "                    50-99人                      2\n",
       "初中                  500-999人                    1\n",
       "大专                  1-49人                     109\n",
       "                    100-499人                   46\n",
       "                    1000-2000人                  8\n",
       "                    10000人以上                    6\n",
       "                    2000-5000人                  2\n",
       "                    50-99人                     54\n",
       "                    500-999人                   17\n",
       "                    5000-10000人                 2\n",
       "大专及以上               500-999人                    2\n",
       "                    5000-10000人                 1\n",
       "学历不限                1-49人                      38\n",
       "                    100-499人                   13\n",
       "                    2000-5000人                  2\n",
       "                    50-99人                     26\n",
       "                    500-999人                    4\n",
       "                    5000-10000人                 1\n",
       "本科                  1-49人                      99\n",
       "                    100-499人                   43\n",
       "                    1000-2000人                 14\n",
       "                    10000人以上                    8\n",
       "                    2000-5000人                  8\n",
       "                    50-99人                     52\n",
       "                    500-999人                   14\n",
       "                    5000-10000人                10\n",
       "本科及以上               100-499人                    1\n",
       "                    50-99人                      1\n",
       "                    5000-10000人                 1\n",
       "硕士                  1-49人                       2\n",
       "                    2000-5000人                  1\n",
       "                    50-99人                      1\n",
       "统招本科                1-49人                       6\n",
       "                    100-499人                    8\n",
       "                    1000-2000人                  4\n",
       "                    10000人以上                    2\n",
       "                    2000-5000人                  6\n",
       "                    50-99人                      7\n",
       "                    500-999人                    6\n",
       "                    5000-10000人                 5"
      ]
     },
     "execution_count": 33,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "学历分组 = df_PM_sx.groupby(['job.requireEduLevel','comp.compScale']).agg({'comp.compName':'count'})\n",
    "学历分组"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "id": "2b1afc3f",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>学历</th>\n",
       "      <th>规模</th>\n",
       "      <th>人数</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>本科</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>99</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>本科</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>43</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>本科</td>\n",
       "      <td>1000-2000人</td>\n",
       "      <td>14</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>本科</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>本科</td>\n",
       "      <td>2000-5000人</td>\n",
       "      <td>8</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>本科</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>52</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>本科</td>\n",
       "      <td>500-999人</td>\n",
       "      <td>14</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>本科</td>\n",
       "      <td>5000-10000人</td>\n",
       "      <td>10</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    学历           规模  人数\n",
       "20  本科        1-49人  99\n",
       "21  本科     100-499人  43\n",
       "22  本科   1000-2000人  14\n",
       "23  本科     10000人以上   8\n",
       "24  本科   2000-5000人   8\n",
       "25  本科       50-99人  52\n",
       "26  本科     500-999人  14\n",
       "27  本科  5000-10000人  10"
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "本科 = 学历分组.reset_index()\\\n",
    "    .rename(columns ={'job.requireEduLevel':'学历','comp.compScale':'规模','comp.compName':'人数'})\\\n",
    "    .query('学历==\"本科\"')\n",
    "本科"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "id": "79defdcf",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "\n",
       "<script>\n",
       "    require.config({\n",
       "        paths: {\n",
       "            'echarts':'https://assets.pyecharts.org/assets/v5/echarts.min'\n",
       "        }\n",
       "    });\n",
       "</script>\n",
       "\n",
       "        <div id=\"5f579ca627514079a4013a93a577094d\" style=\"width:900px; height:500px;\"></div>\n",
       "\n",
       "<script>\n",
       "        require(['echarts'], function(echarts) {\n",
       "                var chart_5f579ca627514079a4013a93a577094d = echarts.init(\n",
       "                    document.getElementById('5f579ca627514079a4013a93a577094d'), 'white', {renderer: 'canvas'});\n",
       "                var option_5f579ca627514079a4013a93a577094d = {\n",
       "    \"backgroundColor\": \"#2c343c\",\n",
       "    \"animation\": true,\n",
       "    \"animationThreshold\": 2000,\n",
       "    \"animationDuration\": 1000,\n",
       "    \"animationEasing\": \"cubicOut\",\n",
       "    \"animationDelay\": 0,\n",
       "    \"animationDurationUpdate\": 300,\n",
       "    \"animationEasingUpdate\": \"cubicOut\",\n",
       "    \"animationDelayUpdate\": 0,\n",
       "    \"aria\": {\n",
       "        \"enabled\": false\n",
       "    },\n",
       "    \"color\": [\n",
       "        \"#5470c6\",\n",
       "        \"#91cc75\",\n",
       "        \"#fac858\",\n",
       "        \"#ee6666\",\n",
       "        \"#73c0de\",\n",
       "        \"#3ba272\",\n",
       "        \"#fc8452\",\n",
       "        \"#9a60b4\",\n",
       "        \"#ea7ccc\"\n",
       "    ],\n",
       "    \"series\": [\n",
       "        {\n",
       "            \"type\": \"pie\",\n",
       "            \"name\": \"\\u8bbf\\u95ee\\u6765\\u6e90\",\n",
       "            \"colorBy\": \"data\",\n",
       "            \"legendHoverLink\": true,\n",
       "            \"selectedMode\": false,\n",
       "            \"selectedOffset\": 10,\n",
       "            \"clockwise\": true,\n",
       "            \"startAngle\": 90,\n",
       "            \"minAngle\": 0,\n",
       "            \"minShowLabelAngle\": 0,\n",
       "            \"avoidLabelOverlap\": true,\n",
       "            \"stillShowZeroSum\": true,\n",
       "            \"percentPrecision\": 2,\n",
       "            \"showEmptyCircle\": true,\n",
       "            \"emptyCircleStyle\": {\n",
       "                \"color\": \"lightgray\",\n",
       "                \"borderColor\": \"#000\",\n",
       "                \"borderWidth\": 0,\n",
       "                \"borderType\": \"solid\",\n",
       "                \"borderDashOffset\": 0,\n",
       "                \"borderCap\": \"butt\",\n",
       "                \"borderJoin\": \"bevel\",\n",
       "                \"borderMiterLimit\": 10,\n",
       "                \"opacity\": 1\n",
       "            },\n",
       "            \"data\": [\n",
       "                {\n",
       "                    \"name\": \"10000\\u4eba\\u4ee5\\u4e0a\",\n",
       "                    \"value\": 8\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"2000-5000\\u4eba\",\n",
       "                    \"value\": 8\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"5000-10000\\u4eba\",\n",
       "                    \"value\": 10\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"1000-2000\\u4eba\",\n",
       "                    \"value\": 14\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"500-999\\u4eba\",\n",
       "                    \"value\": 14\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"100-499\\u4eba\",\n",
       "                    \"value\": 43\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"50-99\\u4eba\",\n",
       "                    \"value\": 52\n",
       "                },\n",
       "                {\n",
       "                    \"name\": \"1-49\\u4eba\",\n",
       "                    \"value\": 99\n",
       "                }\n",
       "            ],\n",
       "            \"radius\": \"55%\",\n",
       "            \"center\": [\n",
       "                \"50%\",\n",
       "                \"50%\"\n",
       "            ],\n",
       "            \"roseType\": \"radius\",\n",
       "            \"label\": {\n",
       "                \"show\": true,\n",
       "                \"color\": \"rgba(255, 255, 255, 0.3)\",\n",
       "                \"margin\": 8\n",
       "            },\n",
       "            \"labelLine\": {\n",
       "                \"show\": true,\n",
       "                \"showAbove\": false,\n",
       "                \"length\": 15,\n",
       "                \"length2\": 15,\n",
       "                \"smooth\": false,\n",
       "                \"minTurnAngle\": 90,\n",
       "                \"maxSurfaceAngle\": 90\n",
       "            },\n",
       "            \"tooltip\": {\n",
       "                \"show\": true,\n",
       "                \"trigger\": \"item\",\n",
       "                \"triggerOn\": \"mousemove|click\",\n",
       "                \"axisPointer\": {\n",
       "                    \"type\": \"line\"\n",
       "                },\n",
       "                \"showContent\": true,\n",
       "                \"alwaysShowContent\": false,\n",
       "                \"showDelay\": 0,\n",
       "                \"hideDelay\": 100,\n",
       "                \"enterable\": false,\n",
       "                \"confine\": false,\n",
       "                \"appendToBody\": false,\n",
       "                \"transitionDuration\": 0.4,\n",
       "                \"formatter\": \"{a} <br/>{b}: {c} ({d}%)\",\n",
       "                \"textStyle\": {\n",
       "                    \"fontSize\": 14\n",
       "                },\n",
       "                \"borderWidth\": 0,\n",
       "                \"padding\": 5,\n",
       "                \"order\": \"seriesAsc\"\n",
       "            },\n",
       "            \"rippleEffect\": {\n",
       "                \"show\": true,\n",
       "                \"brushType\": \"stroke\",\n",
       "                \"scale\": 2.5,\n",
       "                \"period\": 4\n",
       "            }\n",
       "        }\n",
       "    ],\n",
       "    \"legend\": [\n",
       "        {\n",
       "            \"data\": [\n",
       "                \"10000\\u4eba\\u4ee5\\u4e0a\",\n",
       "                \"2000-5000\\u4eba\",\n",
       "                \"5000-10000\\u4eba\",\n",
       "                \"1000-2000\\u4eba\",\n",
       "                \"500-999\\u4eba\",\n",
       "                \"100-499\\u4eba\",\n",
       "                \"50-99\\u4eba\",\n",
       "                \"1-49\\u4eba\"\n",
       "            ],\n",
       "            \"selected\": {},\n",
       "            \"show\": false,\n",
       "            \"padding\": 5,\n",
       "            \"itemGap\": 10,\n",
       "            \"itemWidth\": 25,\n",
       "            \"itemHeight\": 14,\n",
       "            \"backgroundColor\": \"transparent\",\n",
       "            \"borderColor\": \"#ccc\",\n",
       "            \"borderWidth\": 1,\n",
       "            \"borderRadius\": 0,\n",
       "            \"pageButtonItemGap\": 5,\n",
       "            \"pageButtonPosition\": \"end\",\n",
       "            \"pageFormatter\": \"{current}/{total}\",\n",
       "            \"pageIconColor\": \"#2f4554\",\n",
       "            \"pageIconInactiveColor\": \"#aaa\",\n",
       "            \"pageIconSize\": 15,\n",
       "            \"animationDurationUpdate\": 800,\n",
       "            \"selector\": false,\n",
       "            \"selectorPosition\": \"auto\",\n",
       "            \"selectorItemGap\": 7,\n",
       "            \"selectorButtonGap\": 10\n",
       "        }\n",
       "    ],\n",
       "    \"tooltip\": {\n",
       "        \"show\": true,\n",
       "        \"trigger\": \"item\",\n",
       "        \"triggerOn\": \"mousemove|click\",\n",
       "        \"axisPointer\": {\n",
       "            \"type\": \"line\"\n",
       "        },\n",
       "        \"showContent\": true,\n",
       "        \"alwaysShowContent\": false,\n",
       "        \"showDelay\": 0,\n",
       "        \"hideDelay\": 100,\n",
       "        \"enterable\": false,\n",
       "        \"confine\": false,\n",
       "        \"appendToBody\": false,\n",
       "        \"transitionDuration\": 0.4,\n",
       "        \"textStyle\": {\n",
       "            \"fontSize\": 14\n",
       "        },\n",
       "        \"borderWidth\": 0,\n",
       "        \"padding\": 5,\n",
       "        \"order\": \"seriesAsc\"\n",
       "    },\n",
       "    \"title\": [\n",
       "        {\n",
       "            \"show\": true,\n",
       "            \"text\": \"\\u672c\\u79d1\\u4eba\\u6570\",\n",
       "            \"target\": \"blank\",\n",
       "            \"subtarget\": \"blank\",\n",
       "            \"left\": \"center\",\n",
       "            \"top\": \"20\",\n",
       "            \"padding\": 5,\n",
       "            \"itemGap\": 10,\n",
       "            \"textAlign\": \"auto\",\n",
       "            \"textVerticalAlign\": \"auto\",\n",
       "            \"triggerEvent\": false,\n",
       "            \"textStyle\": {\n",
       "                \"color\": \"#fff\"\n",
       "            }\n",
       "        }\n",
       "    ]\n",
       "};\n",
       "                chart_5f579ca627514079a4013a93a577094d.setOption(option_5f579ca627514079a4013a93a577094d);\n",
       "        });\n",
       "    </script>\n"
      ],
      "text/plain": [
       "<pyecharts.render.display.HTML at 0x1d7e7e61d90>"
      ]
     },
     "execution_count": 28,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "import pyecharts.options as opts\n",
    "from pyecharts.charts import Pie\n",
    "\n",
    "\n",
    "x_data = 本科['规模'].values.tolist()\n",
    "y_data = 本科['人数'].values.tolist()\n",
    "data_pair = [list(z) for z in zip(x_data, y_data)]\n",
    "data_pair.sort(key=lambda x: x[1])\n",
    "\n",
    "(\n",
    "    Pie(init_opts=opts.InitOpts(bg_color=\"#2c343c\"))\n",
    "    .add(\n",
    "        series_name=\"访问来源\",\n",
    "        data_pair=data_pair,\n",
    "        rosetype=\"radius\",\n",
    "        radius=\"55%\",\n",
    "        center=[\"50%\", \"50%\"],\n",
    "        label_opts=opts.LabelOpts(is_show=False, position=\"center\"),\n",
    "    )\n",
    "    .set_global_opts(\n",
    "        title_opts=opts.TitleOpts(\n",
    "            title=\"本科人数\",\n",
    "            pos_left=\"center\",\n",
    "            pos_top=\"20\",\n",
    "            title_textstyle_opts=opts.TextStyleOpts(color=\"#fff\"),\n",
    "        ),\n",
    "        legend_opts=opts.LegendOpts(is_show=False),\n",
    "    )\n",
    "    .set_series_opts(\n",
    "        tooltip_opts=opts.TooltipOpts(\n",
    "            trigger=\"item\", formatter=\"{a} <br/>{b}: {c} ({d}%)\"\n",
    "        ),\n",
    "        label_opts=opts.LabelOpts(color=\"rgba(255, 255, 255, 0.3)\"),\n",
    "    )\n",
    "#     .render(\"customized_pie.html\")\n",
    "    .render_notebook()\n",
    ")\n"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "f029c8bf",
   "metadata": {},
   "source": [
    "## 关于薪资的计算"
   ]
  },
  {
   "cell_type": "markdown",
   "id": "1a5cca10",
   "metadata": {},
   "source": [
    "* 关于列名的重命名\n",
 1. df.rename">
    "> 1. `df.rename(columns={name: newname})`"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 170,
   "id": "fd9bc4a1",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职位</th>\n",
       "      <th>薪资</th>\n",
       "      <th>地区</th>\n",
       "      <th>公司</th>\n",
       "      <th>公司规模</th>\n",
       "      <th>职业标签</th>\n",
       "      <th>学历</th>\n",
       "      <th>行业</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>3-5k</td>\n",
       "      <td>广州</td>\n",
       "      <td>广州市拓植文化传播有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>批发/零售</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>4-7k</td>\n",
       "      <td>广州</td>\n",
       "      <td>慢会所</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '新媒体运营']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>家政服务</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>5-8k</td>\n",
       "      <td>广州-番禺区</td>\n",
       "      <td>广州市学晟惠信息科技有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>互联网</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>2-4k</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>广州花林知行研学旅行服务有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>其他商务服务业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>新媒体运营（应届生或实习生）</td>\n",
       "      <td>7-10k</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>蜂助手股份有限公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['本科']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>生活服务O2O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>新媒体运营（有丛气）</td>\n",
       "      <td>9-15k·13薪</td>\n",
       "      <td>广州-荔湾区</td>\n",
       "      <td>立白集团</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']</td>\n",
       "      <td>大专</td>\n",
       "      <td>日化</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>新媒体运营专员</td>\n",
       "      <td>8-13k·13薪</td>\n",
       "      <td>广州</td>\n",
       "      <td>某知名公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>房地产开发经营</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>新媒体运营岗</td>\n",
       "      <td>20-35k</td>\n",
       "      <td>广州-白云区</td>\n",
       "      <td>某广州大型货运/物流/仓储公司</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>货运/物流/仓储</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>15-23k·14薪</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>某国内智能硬件公司</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>['新媒体运营', '活动运营', '线上运营', '抖音平台']</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>智能硬件</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>新媒体运营（公众号、Facebook、titok）</td>\n",
       "      <td>10-15k</td>\n",
       "      <td>广州</td>\n",
       "      <td>某广州计算机软件公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>计算机软件</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                            职位          薪资      地区                公司  \\\n",
       "0                     新媒体运营实习生        3-5k      广州     广州市拓植文化传播有限公司   \n",
       "1                     新媒体运营实习生        4-7k      广州               慢会所   \n",
       "2                     新媒体运营实习生        5-8k  广州-番禺区    广州市学晟惠信息科技有限公司   \n",
       "3                        新媒体运营        2-4k  广州-海珠区  广州花林知行研学旅行服务有限公司   \n",
       "4               新媒体运营（应届生或实习生）       7-10k  广州-天河区         蜂助手股份有限公司   \n",
       "..                         ...         ...     ...               ...   \n",
       "795                 新媒体运营（有丛气）   9-15k·13薪  广州-荔湾区              立白集团   \n",
       "796                    新媒体运营专员   8-13k·13薪      广州             某知名公司   \n",
       "797                     新媒体运营岗      20-35k  广州-白云区   某广州大型货运/物流/仓储公司   \n",
       "798                      新媒体运营  15-23k·14薪  广州-海珠区         某国内智能硬件公司   \n",
       "799  新媒体运营（公众号、Facebook、titok）      10-15k      广州        某广州计算机软件公司   \n",
       "\n",
       "         公司规模                                               职业标签     学历  \\\n",
       "0       1-49人  ['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...    NaN   \n",
       "1       1-49人                                    ['本科', '新媒体运营']    NaN   \n",
       "2       1-49人  ['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...    NaN   \n",
       "3       1-49人                                             ['大专']    NaN   \n",
       "4    100-499人                                             ['本科']    NaN   \n",
       "..        ...                                                ...    ...   \n",
       "795  10000人以上                ['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']     大专   \n",
       "796       NaN  ['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...  大专及以上   \n",
       "797  10000人以上  ['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...   统招本科   \n",
       "798    50-99人                  ['新媒体运营', '活动运营', '线上运营', '抖音平台']   统招本科   \n",
       "799  100-499人     ['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']  本科及以上   \n",
       "\n",
       "           行业  \n",
       "0       批发/零售  \n",
       "1        家政服务  \n",
       "2         互联网  \n",
       "3     其他商务服务业  \n",
       "4     生活服务O2O  \n",
       "..        ...  \n",
       "795        日化  \n",
       "796   房地产开发经营  \n",
       "797  货运/物流/仓储  \n",
       "798      智能硬件  \n",
       "799     计算机软件  \n",
       "\n",
       "[800 rows x 8 columns]"
      ]
     },
     "execution_count": 170,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "#重命名\n",
    "df_PM_gz = df_PM_sx.rename(columns={\n",
    "        'job.title':'职位',\n",
    "        'job.salary':'薪资',\n",
    "        'job.dq':'地区',\n",
    "        'comp.compName':'公司',\n",
    "        'comp.compScale':'公司规模',\n",
    "        'job.labels':'职业标签',\n",
    "        'job.requireEduLevel':'学历',\n",
    "        'comp.compIndustry':'行业'\n",
    "})\n",
    "df_PM_gz"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 171,
   "id": "83dfb8d0",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职位</th>\n",
       "      <th>薪资</th>\n",
       "      <th>地区</th>\n",
       "      <th>公司</th>\n",
       "      <th>公司规模</th>\n",
       "      <th>职业标签</th>\n",
       "      <th>学历</th>\n",
       "      <th>行业</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>3-5k</td>\n",
       "      <td>广州</td>\n",
       "      <td>广州市拓植文化传播有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>批发/零售</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>4-7k</td>\n",
       "      <td>广州</td>\n",
       "      <td>慢会所</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '新媒体运营']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>家政服务</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>5-8k</td>\n",
       "      <td>广州-番禺区</td>\n",
       "      <td>广州市学晟惠信息科技有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>互联网</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>2-4k</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>广州花林知行研学旅行服务有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>其他商务服务业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>新媒体运营（应届生或实习生）</td>\n",
       "      <td>7-10k</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>蜂助手股份有限公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['本科']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>生活服务O2O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>新媒体运营（有丛气）</td>\n",
       "      <td>9-15k·13薪</td>\n",
       "      <td>广州-荔湾区</td>\n",
       "      <td>立白集团</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']</td>\n",
       "      <td>大专</td>\n",
       "      <td>日化</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>新媒体运营专员</td>\n",
       "      <td>8-13k·13薪</td>\n",
       "      <td>广州</td>\n",
       "      <td>某知名公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>房地产开发经营</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>新媒体运营岗</td>\n",
       "      <td>20-35k</td>\n",
       "      <td>广州-白云区</td>\n",
       "      <td>某广州大型货运/物流/仓储公司</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>货运/物流/仓储</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>15-23k·14薪</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>某国内智能硬件公司</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>['新媒体运营', '活动运营', '线上运营', '抖音平台']</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>智能硬件</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>新媒体运营（公众号、Facebook、titok）</td>\n",
       "      <td>10-15k</td>\n",
       "      <td>广州</td>\n",
       "      <td>某广州计算机软件公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>计算机软件</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>743 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                            职位          薪资      地区                公司  \\\n",
       "0                     新媒体运营实习生        3-5k      广州     广州市拓植文化传播有限公司   \n",
       "1                     新媒体运营实习生        4-7k      广州               慢会所   \n",
       "2                     新媒体运营实习生        5-8k  广州-番禺区    广州市学晟惠信息科技有限公司   \n",
       "3                        新媒体运营        2-4k  广州-海珠区  广州花林知行研学旅行服务有限公司   \n",
       "4               新媒体运营（应届生或实习生）       7-10k  广州-天河区         蜂助手股份有限公司   \n",
       "..                         ...         ...     ...               ...   \n",
       "795                 新媒体运营（有丛气）   9-15k·13薪  广州-荔湾区              立白集团   \n",
       "796                    新媒体运营专员   8-13k·13薪      广州             某知名公司   \n",
       "797                     新媒体运营岗      20-35k  广州-白云区   某广州大型货运/物流/仓储公司   \n",
       "798                      新媒体运营  15-23k·14薪  广州-海珠区         某国内智能硬件公司   \n",
       "799  新媒体运营（公众号、Facebook、titok）      10-15k      广州        某广州计算机软件公司   \n",
       "\n",
       "         公司规模                                               职业标签     学历  \\\n",
       "0       1-49人  ['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...    NaN   \n",
       "1       1-49人                                    ['本科', '新媒体运营']    NaN   \n",
       "2       1-49人  ['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...    NaN   \n",
       "3       1-49人                                             ['大专']    NaN   \n",
       "4    100-499人                                             ['本科']    NaN   \n",
       "..        ...                                                ...    ...   \n",
       "795  10000人以上                ['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']     大专   \n",
       "796       NaN  ['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...  大专及以上   \n",
       "797  10000人以上  ['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...   统招本科   \n",
       "798    50-99人                  ['新媒体运营', '活动运营', '线上运营', '抖音平台']   统招本科   \n",
       "799  100-499人     ['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']  本科及以上   \n",
       "\n",
       "           行业  \n",
       "0       批发/零售  \n",
       "1        家政服务  \n",
       "2         互联网  \n",
       "3     其他商务服务业  \n",
       "4     生活服务O2O  \n",
       "..        ...  \n",
       "795        日化  \n",
       "796   房地产开发经营  \n",
       "797  货运/物流/仓储  \n",
       "798      智能硬件  \n",
       "799     计算机软件  \n",
       "\n",
       "[743 rows x 8 columns]"
      ]
     },
     "execution_count": 171,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_gz = df_PM_gz[df_PM_gz['薪资'].str.contains('天') == False]\n",
    "df_PM_gz"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 147,
   "id": "659e7bc0",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职位</th>\n",
       "      <th>薪资</th>\n",
       "      <th>地区</th>\n",
       "      <th>公司</th>\n",
       "      <th>公司规模</th>\n",
       "      <th>职业标签</th>\n",
       "      <th>学历</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>3-5k</td>\n",
       "      <td>广州</td>\n",
       "      <td>广州市拓植文化传播有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>4-7k</td>\n",
       "      <td>广州</td>\n",
       "      <td>慢会所</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '新媒体运营']</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>5-8k</td>\n",
       "      <td>广州-番禺区</td>\n",
       "      <td>广州市学晟惠信息科技有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>2-4k</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>广州花林知行研学旅行服务有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专']</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>新媒体运营（应届生或实习生）</td>\n",
       "      <td>7-10k</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>蜂助手股份有限公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['本科']</td>\n",
       "      <td>NaN</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>新媒体运营（有丛气）</td>\n",
       "      <td>9-15k·13薪</td>\n",
       "      <td>广州-荔湾区</td>\n",
       "      <td>立白集团</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']</td>\n",
       "      <td>大专</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>新媒体运营专员</td>\n",
       "      <td>8-13k·13薪</td>\n",
       "      <td>广州</td>\n",
       "      <td>某知名公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...</td>\n",
       "      <td>大专及以上</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>新媒体运营岗</td>\n",
       "      <td>20-35k</td>\n",
       "      <td>广州-白云区</td>\n",
       "      <td>某广州大型货运/物流/仓储公司</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...</td>\n",
       "      <td>统招本科</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>15-23k·14薪</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>某国内智能硬件公司</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>['新媒体运营', '活动运营', '线上运营', '抖音平台']</td>\n",
       "      <td>统招本科</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>新媒体运营（公众号、Facebook、titok）</td>\n",
       "      <td>10-15k</td>\n",
       "      <td>广州</td>\n",
       "      <td>某广州计算机软件公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']</td>\n",
       "      <td>本科及以上</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>738 rows × 7 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                            职位          薪资      地区                公司  \\\n",
       "0                     新媒体运营实习生        3-5k      广州     广州市拓植文化传播有限公司   \n",
       "1                     新媒体运营实习生        4-7k      广州               慢会所   \n",
       "2                     新媒体运营实习生        5-8k  广州-番禺区    广州市学晟惠信息科技有限公司   \n",
       "3                        新媒体运营        2-4k  广州-海珠区  广州花林知行研学旅行服务有限公司   \n",
       "4               新媒体运营（应届生或实习生）       7-10k  广州-天河区         蜂助手股份有限公司   \n",
       "..                         ...         ...     ...               ...   \n",
       "795                 新媒体运营（有丛气）   9-15k·13薪  广州-荔湾区              立白集团   \n",
       "796                    新媒体运营专员   8-13k·13薪      广州             某知名公司   \n",
       "797                     新媒体运营岗      20-35k  广州-白云区   某广州大型货运/物流/仓储公司   \n",
       "798                      新媒体运营  15-23k·14薪  广州-海珠区         某国内智能硬件公司   \n",
       "799  新媒体运营（公众号、Facebook、titok）      10-15k      广州        某广州计算机软件公司   \n",
       "\n",
       "         公司规模                                               职业标签     学历  \n",
       "0       1-49人  ['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...    NaN  \n",
       "1       1-49人                                    ['本科', '新媒体运营']    NaN  \n",
       "2       1-49人  ['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...    NaN  \n",
       "3       1-49人                                             ['大专']    NaN  \n",
       "4    100-499人                                             ['本科']    NaN  \n",
       "..        ...                                                ...    ...  \n",
       "795  10000人以上                ['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']     大专  \n",
       "796       NaN  ['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...  大专及以上  \n",
       "797  10000人以上  ['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...   统招本科  \n",
       "798    50-99人                  ['新媒体运营', '活动运营', '线上运营', '抖音平台']   统招本科  \n",
       "799  100-499人     ['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']  本科及以上  \n",
       "\n",
       "[738 rows x 7 columns]"
      ]
     },
     "execution_count": 147,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_gz = df_PM_gz[df_PM_gz['薪资'].str.contains('元') == False]\n",
    "df_PM_gz"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 188,
   "id": "134b2cf5",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职位</th>\n",
       "      <th>薪资</th>\n",
       "      <th>地区</th>\n",
       "      <th>公司</th>\n",
       "      <th>公司规模</th>\n",
       "      <th>职业标签</th>\n",
       "      <th>学历</th>\n",
       "      <th>行业</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>3-5k</td>\n",
       "      <td>广州</td>\n",
       "      <td>广州市拓植文化传播有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>批发/零售</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>4-7k</td>\n",
       "      <td>广州</td>\n",
       "      <td>慢会所</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '新媒体运营']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>家政服务</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>5-8k</td>\n",
       "      <td>广州-番禺区</td>\n",
       "      <td>广州市学晟惠信息科技有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>互联网</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>2-4k</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>广州花林知行研学旅行服务有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>其他商务服务业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>新媒体运营（应届生或实习生）</td>\n",
       "      <td>7-10k</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>蜂助手股份有限公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['本科']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>生活服务O2O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>新媒体运营（有丛气）</td>\n",
       "      <td>9-15k·13薪</td>\n",
       "      <td>广州-荔湾区</td>\n",
       "      <td>立白集团</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']</td>\n",
       "      <td>大专</td>\n",
       "      <td>日化</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>新媒体运营专员</td>\n",
       "      <td>8-13k·13薪</td>\n",
       "      <td>广州</td>\n",
       "      <td>某知名公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>房地产开发经营</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>新媒体运营岗</td>\n",
       "      <td>20-35k</td>\n",
       "      <td>广州-白云区</td>\n",
       "      <td>某广州大型货运/物流/仓储公司</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>货运/物流/仓储</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>15-23k·14薪</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>某国内智能硬件公司</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>['新媒体运营', '活动运营', '线上运营', '抖音平台']</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>智能硬件</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>新媒体运营（公众号、Facebook、titok）</td>\n",
       "      <td>10-15k</td>\n",
       "      <td>广州</td>\n",
       "      <td>某广州计算机软件公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>计算机软件</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>738 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                            职位          薪资      地区                公司  \\\n",
       "0                     新媒体运营实习生        3-5k      广州     广州市拓植文化传播有限公司   \n",
       "1                     新媒体运营实习生        4-7k      广州               慢会所   \n",
       "2                     新媒体运营实习生        5-8k  广州-番禺区    广州市学晟惠信息科技有限公司   \n",
       "3                        新媒体运营        2-4k  广州-海珠区  广州花林知行研学旅行服务有限公司   \n",
       "4               新媒体运营（应届生或实习生）       7-10k  广州-天河区         蜂助手股份有限公司   \n",
       "..                         ...         ...     ...               ...   \n",
       "795                 新媒体运营（有丛气）   9-15k·13薪  广州-荔湾区              立白集团   \n",
       "796                    新媒体运营专员   8-13k·13薪      广州             某知名公司   \n",
       "797                     新媒体运营岗      20-35k  广州-白云区   某广州大型货运/物流/仓储公司   \n",
       "798                      新媒体运营  15-23k·14薪  广州-海珠区         某国内智能硬件公司   \n",
       "799  新媒体运营（公众号、Facebook、titok）      10-15k      广州        某广州计算机软件公司   \n",
       "\n",
       "         公司规模                                               职业标签     学历  \\\n",
       "0       1-49人  ['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...    NaN   \n",
       "1       1-49人                                    ['本科', '新媒体运营']    NaN   \n",
       "2       1-49人  ['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...    NaN   \n",
       "3       1-49人                                             ['大专']    NaN   \n",
       "4    100-499人                                             ['本科']    NaN   \n",
       "..        ...                                                ...    ...   \n",
       "795  10000人以上                ['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']     大专   \n",
       "796       NaN  ['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...  大专及以上   \n",
       "797  10000人以上  ['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...   统招本科   \n",
       "798    50-99人                  ['新媒体运营', '活动运营', '线上运营', '抖音平台']   统招本科   \n",
       "799  100-499人     ['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']  本科及以上   \n",
       "\n",
       "           行业  \n",
       "0       批发/零售  \n",
       "1        家政服务  \n",
       "2         互联网  \n",
       "3     其他商务服务业  \n",
       "4     生活服务O2O  \n",
       "..        ...  \n",
       "795        日化  \n",
       "796   房地产开发经营  \n",
       "797  货运/物流/仓储  \n",
       "798      智能硬件  \n",
       "799     计算机软件  \n",
       "\n",
       "[738 rows x 8 columns]"
      ]
     },
     "execution_count": 188,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_gz = df_PM_gz[df_PM_gz['薪资'].str.contains('月') == False]\n",
    "df_PM_gz"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 189,
   "id": "4e3ee276",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0            3-5k\n",
       "1            4-7k\n",
       "2            5-8k\n",
       "3            2-4k\n",
       "4           7-10k\n",
       "          ...    \n",
       "795     9-15k·13薪\n",
       "796     8-13k·13薪\n",
       "797        20-35k\n",
       "798    15-23k·14薪\n",
       "799        10-15k\n",
       "Name: 薪资, Length: 738, dtype: object"
      ]
     },
     "execution_count": 189,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_gz['薪资']"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 173,
   "id": "1f9c322c",
   "metadata": {},
   "outputs": [],
   "source": [
    "##处理数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 190,
   "id": "d9052ce4",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "array(['3-5k', '4-7k', '5-8k', '2-4k', '7-10k', '6-8k·14薪', '4-5k',\n",
       "       '3-6k', '4-7k', '4-6k', '薪资面议', '6-12k', '5-8k', '8-15k', '5-10k',\n",
       "       '4-6k', '15-30k·13薪', '4-6k', '4-6k', '9-12k', '6-8k', '5-9k',\n",
       "       '4-6k·13薪', '10-12k·13薪', '3-6k', '4-8k', '5-10k', '5-10k·13薪',\n",
       "       '5-10k', '5-10k', '4-6k', '4-6k', '5-8k', '5-8k', '5-8k', '4-5k',\n",
       "       '3-5k', '3-6k', '1-2k', '4-8k', '10-15k·14薪', '6-8k', '6-10k',\n",
       "       '3-5k', '7-12k·13薪', '4-6k', '7-9k', '5-8k', '2-4k', '6-12k',\n",
       "       '5-8k', '5-9k', '4-7k', '5-10k·13薪', '2-4k', '6-12k', '3-6k',\n",
       "       '6-8k·13薪', '5-10k', '8-13k', '8-11k', '8-18k·13薪', '5-8k', '4-8k',\n",
       "       '5-9k', '8-10k', '5-6k', '5-7k', '12-25k', '8-13k', '4-5k',\n",
       "       '19-35k', '5-8k', '8-15k', '6-10k', '6-7k', '5-8k', '4-8k', '4-6k',\n",
       "       '1-2k', '7-12k·13薪', '5-10k', '7-8k', '4-8k', '3-4k', '7-12k',\n",
       "       '5-6k', '6-12k', '4-8k', '4-8k', '5-10k', '4-9k', '6-9k', '5-8k',\n",
       "       '3-5k', '3-5k', '4-6k', '8-13k', '6-10k', '15-25k·13薪', '5-8k',\n",
       "       '5-15k', '5-8k', '8-13k·13薪', '4-6k', '5-8k', '9-12k', '6-10k',\n",
       "       '2-4k', '5-10k', '3-5k', '6-10k', '4-6k', '6-12k·13薪', '4-6k',\n",
       "       '4-6k', '3-5k', '2-3k', '5-8k', '8-13k', '4-6k', '6-7k', '5-10k',\n",
       "       '4-6k', '4-7k', '5-8k', '5-15k', '7-9k', '5-8k', '5-8k', '5-8k',\n",
       "       '6-8k', '5-8k', '6-10k', '5-8k', '6-8k', '4-6k·13薪', '5-10k',\n",
       "       '2-3k', '5-8k', '3-6k', '2-3k', '5-7k', '4-7k', '3-7k·13薪', '4-8k',\n",
       "       '9-12k', '4-6k', '6-8k', '4-7k', '3-4k', '5-8k', '5-8k', '5-8k',\n",
       "       '5-8k', '3-5k', '3-5k', '3-5k', '8-12k', '6-12k', '4-8k·13薪',\n",
       "       '3-8k', '4-8k', '4-8k', '4-8k', '5-7k', '5-10k', '6-10k', '5-10k',\n",
       "       '2-5k', '3-4k', '4-7k', '4-5k', '1-2k', '4-6k', '4-8k', '8-12k',\n",
       "       '4-7k', '15-18k', '7-8k', '6-8k', '1-2k', '5-10k·14薪', '3-5k',\n",
       "       '1-2k', '2-3k', '4-8k', '8-12k·14薪', '8-9k', '4-5k', '7-11k',\n",
       "       '7-10k', '7-10k', '5-8k', '6-7k', '6-8k', '1-3k', '4-8k',\n",
       "       '7-9k·13薪', '6-8k', '1-3k', '3-5k', '6-12k', '8-10k·13薪',\n",
       "       '9-13k·14薪', '7-15k·14薪', '5-7k', '5-8k', '6-9k', '6-12k',\n",
       "       '11-22k', '4-6k', '薪资面议', '4-9k', '3-6k', '2-3k', '3-5k', '1-3k',\n",
       "       '6-8k', '10-15k·13薪', '2-3k', '6-8k·13薪', '2-3k', '5-10k', '2-3k',\n",
       "       '5-8k', '6-8k·13薪', '8-12k', '2-3k', '4-6k·13薪', '7-9k', '12-20k',\n",
       "       '15-30k', '5-8k', '5-9k·13薪', '8-15k', '5-8k', '6-9k', '10-15k',\n",
       "       '8-12k', '6-12k', '5-9k', '7-15k', '7-12k', '5-6k', '25-35k·14薪',\n",
       "       '4-8k·13薪', '7-12k', '5-7k', '5-8k', '5-8k', '2-3k', '3-5k',\n",
       "       '2-3k', '3-6k', '10-15k', '8-13k', '12-20k', '15-20k·16薪',\n",
       "       '10-20k', '5-8k', '2-3k', '8-13k', '8-12k', '5-8k', '5-8k', '4-6k',\n",
       "       '5-9k·13薪', '7-10k·13薪', '3-5k', '10-12k·13薪', '5-7k', '15-18k',\n",
       "       '8-16k', '3-4k', '6-11k·13薪', '6-7k·14薪', '3-5k', '6-11k', '6-8k',\n",
       "       '4-8k', '8-13k·13薪', '7-10k', '4-8k', '10-15k', '5-7k', '5-7k',\n",
       "       '12-13k', '4-6k', '8-13k', '8-13k', '4-8k', '6-12k', '3-4k',\n",
       "       '5-10k', '4-12k', '15-23k', '4-6k', '6-11k', '5-10k', '5-7k',\n",
       "       '5-10k', '5-8k', '5-8k', '5-8k', '4-6k', '4-7k', '15-40k', '7-12k',\n",
       "       '3-5k', '5-8k', '7-11k', '7-12k', '4-6k', '6-10k', '4-9k',\n",
       "       '5-9k·13薪', '5-8k', '7-10k', '5-8k', '5-8k', '8-13k', '8-13k',\n",
       "       '5-10k', '5-10k', '8-13k', '3-8k', '10-14k', '6-8k', '6-8k',\n",
       "       '8-12k', '3-4k', '4-8k', '3-6k', '3-5k', '7-9k', '5-8k', '6-10k',\n",
       "       '5-8k', '2-5k', '5-10k', '4-8k', '5-8k', '4-8k', '5-7k', '6-10k',\n",
       "       '6-8k', '4-6k', '5-8k', '4-7k', '6-10k', '15-20k', '4-9k·14薪',\n",
       "       '5-8k', '5-10k', '4-8k', '5-8k', '4-8k', '5-6k', '6-11k', '5-10k',\n",
       "       '4-8k', '10-15k·13薪', '5-10k', '6-10k', '8-13k', '7-10k', '3-4k',\n",
       "       '5-8k', '6-9k', '6-9k', '3-8k', '4-8k', '8-10k', '8-10k', '6-11k',\n",
       "       '7-10k', '8-12k', '6-11k', '5-8k', '5-8k', '3-8k', '5-8k', '2-6k',\n",
       "       '4-8k', '8-10k', '4-7k', '5-8k', '7-12k', '3-8k', '2-5k', '4-6k',\n",
       "       '3-6k', '3-7k', '5-8k', '5-8k', '5-10k', '5-8k', '5-10k', '4-7k',\n",
       "       '4-7k', '4-6k', '3-4k', '4-6k', '8-13k·13薪', '3-4k', '10-15k',\n",
       "       '5-6k', '6-8k·13薪', '6-12k', '15-30k', '6-10k', '5-7k', '8-12k',\n",
       "       '8-12k', '7-10k', '6-10k', '4-6k', '4-6k', '6-8k·13薪', '8-12k',\n",
       "       '7-12k', '5-8k', '3-5k', '6-8k·13薪', '5-8k', '5-6k', '8-15k·13薪',\n",
       "       '8-13k', '10-15k·13薪', '5-10k', '4-6k', '4-6k', '5-8k', '5-8k',\n",
       "       '6-10k', '5-8k', '30-45k', '8-12k', '15-25k', '9-13k', '15-30k',\n",
       "       '20-30k', '12-18k', '6-8k', '6-10k', '8-15k', '6-9k', '8-13k',\n",
       "       '10-20k', '12-15k', '6-8k', '6-8k·13薪', '20-30k', '10-15k',\n",
       "       '8-13k', '18-25k', '7-12k·13薪', '18-25k', '8-12k', '20-30k',\n",
       "       '25-40k', '12-18k·13薪', '6-13k·13薪', '7-10k', '6-9k', '5-7k',\n",
       "       '15-30k', '5-10k', '6-11k', '10-20k·13薪', '22-30k·13薪', '6-9k',\n",
       "       '7-12k', '25-35k', '7-10k·13薪', '5-10k', '15-20k', '15-20k·13薪',\n",
       "       '15-25k', '5-8k', '12-20k·13薪', '8-13k', '6-9k', '20-25k',\n",
       "       '12-28k', '8-10k', '8-15k', '5-10k', '8-10k', '7-12k', '6-10k',\n",
       "       '6-8k·13薪', '5-8k', '5-7k', '5-8k', '6-10k·13薪', '6-8k', '9-15k',\n",
       "       '7-10k', '6-10k', '6-11k', '10-15k', '4-7k', '5-8k', '30-50k',\n",
       "       '15-30k·14薪', '15-30k', '12-23k', '8-13k', '7-11k', '7-10k',\n",
       "       '11-22k', '20-23k', '15-20k', '6-12k', '8-10k', '12-18k', '6-9k',\n",
       "       '6-9k', '8-10k', '20-30k', '7-10k', '8-13k', '10-15k', '10-15k',\n",
       "       '5-9k', '4-6k', '5-10k·13薪', '7-10k', '7-10k', '8-10k·13薪', '5-8k',\n",
       "       '18-22k', '5-8k', '4-6k', '7-10k', '5-10k·13薪', '4-9k', '4-6k',\n",
       "       '4-6k', '8-10k·13薪', '4-8k·13薪', '5-10k', '8-10k', '6-11k',\n",
       "       '5-10k·13薪', '4-6k', '8-10k', '5-8k', '6-18k', '6-10k·14薪',\n",
       "       '10-15k', '6-9k', '8-15k', '12-15k', '15-30k', '10-15k', '20-25k',\n",
       "       '18-25k', '15-30k·13薪', '20-25k·13薪', '28-35k', '10-20k', '18-25k',\n",
       "       '12-17k', '15-20k', '10-15k', '14-20k', '6-11k', '12-17k',\n",
       "       '15-20k', '15-25k', '15-18k·13薪', '12-16k', '15-25k', '16-25k·13薪',\n",
       "       '10-20k', '12-15k·13薪', '13-16k', '5-8k', '7-10k', '6-10k', '5-8k',\n",
       "       '6-8k', '8-13k', '13-14k', '5-10k', '8-15k', '9-13k·13薪', '6-10k',\n",
       "       '15-25k', '9-15k', '5-10k', '8-15k', '6-10k', '7-12k', '7-10k',\n",
       "       '6-7k', '5-10k', '8-15k', '5-8k', '12-18k', '6-12k', '7-10k',\n",
       "       '5-10k', '5-8k', '8-10k', '11-22k', '7-11k·13薪', '7-10k',\n",
       "       '4-6k·13薪', '8-10k', '7-12k', '8-10k·13薪', '6-12k', '4-6k', '4-8k',\n",
       "       '5-8k', '5-8k', '8-10k·13薪', '8-12k', '8-12k', '12-24k', '15-25k',\n",
       "       '5-8k', '15-25k', '6-9k', '8-16k', '8-12k', '8-14k', '9-10k',\n",
       "       '7-12k·13薪', '10-20k', '12-17k', '10-15k·13薪', '6-9k', '10-15k',\n",
       "       '7-10k', '5-8k', '4-8k', '12-16k·13薪', '8-15k·13薪', '8-12k·14薪',\n",
       "       '15-25k', '7-15k·13薪', '6-12k', '4-7k·13薪', '10-15k', '5-8k',\n",
       "       '7-12k·13薪', '6-11k', '5-12k', '8-13k', '6-10k', '9-14k', '8-12k',\n",
       "       '7-10k', '12-15k·13薪', '10-15k', '3-5k', '13-18k·13薪', '16-25k',\n",
       "       '15-22k·13薪', '10-15k', '20-30k', '5-8k·13薪', '20-30k', '20-30k',\n",
       "       '10-20k', '9-14k', '6-10k', '8-12k', '5-8k', '8-13k', '7-8k',\n",
       "       '5-8k', '4-6k', '8-10k', '9-12k', '5-8k', '8-12k', '5-8k', '9-13k',\n",
       "       '15-25k', '7-12k·13薪', '7-12k', '6-8k', '6-10k', '5-10k', '10-15k',\n",
       "       '8-15k', '6-10k', '6-10k·17薪', '6-8k', '20-27k', '6-11k', '6-9k',\n",
       "       '15-30k', '6-8k', '4-6k', '8-12k', '6-8k', '5-8k', '10-15k',\n",
       "       '10-15k', '12-13k', '面议', '15-25k', '10-20k·13薪', '6-8k', '7-10k',\n",
       "       '15-30k', '5-8k', '11-18k·13薪', '6-10k', '6-10k', '9-17k', '8-13k',\n",
       "       '6-10k', '8-10k', '6-9k', '5-8k·14薪', '11-16k', '8-12k', '7-10k',\n",
       "       '10-20k', '6-15k', '12-17k', '6-8k', '7-10k', '10-20k', '6-9k',\n",
       "       '9-15k·13薪', '8-13k·13薪', '20-35k', '15-23k·14薪', '10-15k'],\n",
       "      dtype=object)"
      ]
     },
     "execution_count": 190,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_PM_gz['薪资'].values"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 192,
   "id": "e51ac171",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职位</th>\n",
       "      <th>薪资</th>\n",
       "      <th>地区</th>\n",
       "      <th>公司</th>\n",
       "      <th>公司规模</th>\n",
       "      <th>职业标签</th>\n",
       "      <th>学历</th>\n",
       "      <th>行业</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>3-5k</td>\n",
       "      <td>广州</td>\n",
       "      <td>广州市拓植文化传播有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>批发/零售</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>4-7k</td>\n",
       "      <td>广州</td>\n",
       "      <td>慢会所</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '新媒体运营']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>家政服务</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>5-8k</td>\n",
       "      <td>广州-番禺区</td>\n",
       "      <td>广州市学晟惠信息科技有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>互联网</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>2-4k</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>广州花林知行研学旅行服务有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>其他商务服务业</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>新媒体运营（应届生或实习生）</td>\n",
       "      <td>7-10k</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>蜂助手股份有限公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['本科']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>生活服务O2O</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>新媒体运营（有丛气）</td>\n",
       "      <td>9-15k·13薪</td>\n",
       "      <td>广州-荔湾区</td>\n",
       "      <td>立白集团</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']</td>\n",
       "      <td>大专</td>\n",
       "      <td>日化</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>新媒体运营专员</td>\n",
       "      <td>8-13k·13薪</td>\n",
       "      <td>广州</td>\n",
       "      <td>某知名公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>房地产开发经营</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>新媒体运营岗</td>\n",
       "      <td>20-35k</td>\n",
       "      <td>广州-白云区</td>\n",
       "      <td>某广州大型货运/物流/仓储公司</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>货运/物流/仓储</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>15-23k·14薪</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>某国内智能硬件公司</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>['新媒体运营', '活动运营', '线上运营', '抖音平台']</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>智能硬件</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>新媒体运营（公众号、Facebook、titok）</td>\n",
       "      <td>10-15k</td>\n",
       "      <td>广州</td>\n",
       "      <td>某广州计算机软件公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>计算机软件</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>735 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                            职位          薪资      地区                公司  \\\n",
       "0                     新媒体运营实习生        3-5k      广州     广州市拓植文化传播有限公司   \n",
       "1                     新媒体运营实习生        4-7k      广州               慢会所   \n",
       "2                     新媒体运营实习生        5-8k  广州-番禺区    广州市学晟惠信息科技有限公司   \n",
       "3                        新媒体运营        2-4k  广州-海珠区  广州花林知行研学旅行服务有限公司   \n",
       "4               新媒体运营（应届生或实习生）       7-10k  广州-天河区         蜂助手股份有限公司   \n",
       "..                         ...         ...     ...               ...   \n",
       "795                 新媒体运营（有丛气）   9-15k·13薪  广州-荔湾区              立白集团   \n",
       "796                    新媒体运营专员   8-13k·13薪      广州             某知名公司   \n",
       "797                     新媒体运营岗      20-35k  广州-白云区   某广州大型货运/物流/仓储公司   \n",
       "798                      新媒体运营  15-23k·14薪  广州-海珠区         某国内智能硬件公司   \n",
       "799  新媒体运营（公众号、Facebook、titok）      10-15k      广州        某广州计算机软件公司   \n",
       "\n",
       "         公司规模                                               职业标签     学历  \\\n",
       "0       1-49人  ['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...    NaN   \n",
       "1       1-49人                                    ['本科', '新媒体运营']    NaN   \n",
       "2       1-49人  ['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...    NaN   \n",
       "3       1-49人                                             ['大专']    NaN   \n",
       "4    100-499人                                             ['本科']    NaN   \n",
       "..        ...                                                ...    ...   \n",
       "795  10000人以上                ['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']     大专   \n",
       "796       NaN  ['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...  大专及以上   \n",
       "797  10000人以上  ['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...   统招本科   \n",
       "798    50-99人                  ['新媒体运营', '活动运营', '线上运营', '抖音平台']   统招本科   \n",
       "799  100-499人     ['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']  本科及以上   \n",
       "\n",
       "           行业  \n",
       "0       批发/零售  \n",
       "1        家政服务  \n",
       "2         互联网  \n",
       "3     其他商务服务业  \n",
       "4     生活服务O2O  \n",
       "..        ...  \n",
       "795        日化  \n",
       "796   房地产开发经营  \n",
       "797  货运/物流/仓储  \n",
       "798      智能硬件  \n",
       "799     计算机软件  \n",
       "\n",
       "[735 rows x 8 columns]"
      ]
     },
     "execution_count": 192,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_非薪资面议 = df_PM_gz.query('薪资 != \"薪资面议\" and 薪资!=\"面议\"')\n",
    "df_非薪资面议"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 193,
   "id": "aef794e4",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0            [3-5, ]\n",
       "1            [4-7, ]\n",
       "2            [5-8, ]\n",
       "3            [2-4, ]\n",
       "4           [7-10, ]\n",
       "           ...      \n",
       "795     [9-15, ·13薪]\n",
       "796     [8-13, ·13薪]\n",
       "797        [20-35, ]\n",
       "798    [15-23, ·14薪]\n",
       "799        [10-15, ]\n",
       "Name: 薪资, Length: 735, dtype: object"
      ]
     },
     "execution_count": 193,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_非薪资面议['薪资'].apply(lambda x:x.split('k'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 194,
   "id": "f7d5d180",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0       4.0\n",
       "1       5.5\n",
       "2       6.5\n",
       "3       3.0\n",
       "4       8.5\n",
       "       ... \n",
       "795    12.0\n",
       "796    10.5\n",
       "797    27.5\n",
       "798    19.0\n",
       "799    12.5\n",
       "Name: 薪资, Length: 735, dtype: float64"
      ]
     },
     "execution_count": 194,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 未处理年薪13及以上\n",
    "df_非薪资面议['薪资'].apply(lambda x : ( int(x.split('k')[0].split('-')[0]) + int(x.split('k')[0].split('-')[1]) ) / 2)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 195,
   "id": "08751c8f",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0            [3-5k]\n",
       "1            [4-7k]\n",
       "2            [5-8k]\n",
       "3            [2-4k]\n",
       "4           [7-10k]\n",
       "           ...     \n",
       "795     [9-15k, 13]\n",
       "796     [8-13k, 13]\n",
       "797        [20-35k]\n",
       "798    [15-23k, 14]\n",
       "799        [10-15k]\n",
       "Name: 薪资, Length: 735, dtype: object"
      ]
     },
     "execution_count": 195,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 处理所有的\n",
    "df_非薪资面议['薪资'].apply(lambda x : x.split('薪')[0].split('·'))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 196,
   "id": "474cdcd3",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[['3-5k'],\n",
       " ['4-7k'],\n",
       " ['5-8k'],\n",
       " ['2-4k'],\n",
       " ['7-10k'],\n",
       " ['6-8k', '14'],\n",
       " ['4-5k'],\n",
       " ['3-6k'],\n",
       " ['4-7k'],\n",
       " ['4-6k'],\n",
       " ['6-12k'],\n",
       " ['5-8k'],\n",
       " ['8-15k'],\n",
       " ['5-10k'],\n",
       " ['4-6k'],\n",
       " ['15-30k', '13'],\n",
       " ['4-6k'],\n",
       " ['4-6k'],\n",
       " ['9-12k'],\n",
       " ['6-8k'],\n",
       " ['5-9k'],\n",
       " ['4-6k', '13'],\n",
       " ['10-12k', '13'],\n",
       " ['3-6k'],\n",
       " ['4-8k'],\n",
       " ['5-10k'],\n",
       " ['5-10k', '13'],\n",
       " ['5-10k'],\n",
       " ['5-10k'],\n",
       " ['4-6k'],\n",
       " ['4-6k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['4-5k'],\n",
       " ['3-5k'],\n",
       " ['3-6k'],\n",
       " ['1-2k'],\n",
       " ['4-8k'],\n",
       " ['10-15k', '14'],\n",
       " ['6-8k'],\n",
       " ['6-10k'],\n",
       " ['3-5k'],\n",
       " ['7-12k', '13'],\n",
       " ['4-6k'],\n",
       " ['7-9k'],\n",
       " ['5-8k'],\n",
       " ['2-4k'],\n",
       " ['6-12k'],\n",
       " ['5-8k'],\n",
       " ['5-9k'],\n",
       " ['4-7k'],\n",
       " ['5-10k', '13'],\n",
       " ['2-4k'],\n",
       " ['6-12k'],\n",
       " ['3-6k'],\n",
       " ['6-8k', '13'],\n",
       " ['5-10k'],\n",
       " ['8-13k'],\n",
       " ['8-11k'],\n",
       " ['8-18k', '13'],\n",
       " ['5-8k'],\n",
       " ['4-8k'],\n",
       " ['5-9k'],\n",
       " ['8-10k'],\n",
       " ['5-6k'],\n",
       " ['5-7k'],\n",
       " ['12-25k'],\n",
       " ['8-13k'],\n",
       " ['4-5k'],\n",
       " ['19-35k'],\n",
       " ['5-8k'],\n",
       " ['8-15k'],\n",
       " ['6-10k'],\n",
       " ['6-7k'],\n",
       " ['5-8k'],\n",
       " ['4-8k'],\n",
       " ['4-6k'],\n",
       " ['1-2k'],\n",
       " ['7-12k', '13'],\n",
       " ['5-10k'],\n",
       " ['7-8k'],\n",
       " ['4-8k'],\n",
       " ['3-4k'],\n",
       " ['7-12k'],\n",
       " ['5-6k'],\n",
       " ['6-12k'],\n",
       " ['4-8k'],\n",
       " ['4-8k'],\n",
       " ['5-10k'],\n",
       " ['4-9k'],\n",
       " ['6-9k'],\n",
       " ['5-8k'],\n",
       " ['3-5k'],\n",
       " ['3-5k'],\n",
       " ['4-6k'],\n",
       " ['8-13k'],\n",
       " ['6-10k'],\n",
       " ['15-25k', '13'],\n",
       " ['5-8k'],\n",
       " ['5-15k'],\n",
       " ['5-8k'],\n",
       " ['8-13k', '13'],\n",
       " ['4-6k'],\n",
       " ['5-8k'],\n",
       " ['9-12k'],\n",
       " ['6-10k'],\n",
       " ['2-4k'],\n",
       " ['5-10k'],\n",
       " ['3-5k'],\n",
       " ['6-10k'],\n",
       " ['4-6k'],\n",
       " ['6-12k', '13'],\n",
       " ['4-6k'],\n",
       " ['4-6k'],\n",
       " ['3-5k'],\n",
       " ['2-3k'],\n",
       " ['5-8k'],\n",
       " ['8-13k'],\n",
       " ['4-6k'],\n",
       " ['6-7k'],\n",
       " ['5-10k'],\n",
       " ['4-6k'],\n",
       " ['4-7k'],\n",
       " ['5-8k'],\n",
       " ['5-15k'],\n",
       " ['7-9k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['6-8k'],\n",
       " ['5-8k'],\n",
       " ['6-10k'],\n",
       " ['5-8k'],\n",
       " ['6-8k'],\n",
       " ['4-6k', '13'],\n",
       " ['5-10k'],\n",
       " ['2-3k'],\n",
       " ['5-8k'],\n",
       " ['3-6k'],\n",
       " ['2-3k'],\n",
       " ['5-7k'],\n",
       " ['4-7k'],\n",
       " ['3-7k', '13'],\n",
       " ['4-8k'],\n",
       " ['9-12k'],\n",
       " ['4-6k'],\n",
       " ['6-8k'],\n",
       " ['4-7k'],\n",
       " ['3-4k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['3-5k'],\n",
       " ['3-5k'],\n",
       " ['3-5k'],\n",
       " ['8-12k'],\n",
       " ['6-12k'],\n",
       " ['4-8k', '13'],\n",
       " ['3-8k'],\n",
       " ['4-8k'],\n",
       " ['4-8k'],\n",
       " ['4-8k'],\n",
       " ['5-7k'],\n",
       " ['5-10k'],\n",
       " ['6-10k'],\n",
       " ['5-10k'],\n",
       " ['2-5k'],\n",
       " ['3-4k'],\n",
       " ['4-7k'],\n",
       " ['4-5k'],\n",
       " ['1-2k'],\n",
       " ['4-6k'],\n",
       " ['4-8k'],\n",
       " ['8-12k'],\n",
       " ['4-7k'],\n",
       " ['15-18k'],\n",
       " ['7-8k'],\n",
       " ['6-8k'],\n",
       " ['1-2k'],\n",
       " ['5-10k', '14'],\n",
       " ['3-5k'],\n",
       " ['1-2k'],\n",
       " ['2-3k'],\n",
       " ['4-8k'],\n",
       " ['8-12k', '14'],\n",
       " ['8-9k'],\n",
       " ['4-5k'],\n",
       " ['7-11k'],\n",
       " ['7-10k'],\n",
       " ['7-10k'],\n",
       " ['5-8k'],\n",
       " ['6-7k'],\n",
       " ['6-8k'],\n",
       " ['1-3k'],\n",
       " ['4-8k'],\n",
       " ['7-9k', '13'],\n",
       " ['6-8k'],\n",
       " ['1-3k'],\n",
       " ['3-5k'],\n",
       " ['6-12k'],\n",
       " ['8-10k', '13'],\n",
       " ['9-13k', '14'],\n",
       " ['7-15k', '14'],\n",
       " ['5-7k'],\n",
       " ['5-8k'],\n",
       " ['6-9k'],\n",
       " ['6-12k'],\n",
       " ['11-22k'],\n",
       " ['4-6k'],\n",
       " ['4-9k'],\n",
       " ['3-6k'],\n",
       " ['2-3k'],\n",
       " ['3-5k'],\n",
       " ['1-3k'],\n",
       " ['6-8k'],\n",
       " ['10-15k', '13'],\n",
       " ['2-3k'],\n",
       " ['6-8k', '13'],\n",
       " ['2-3k'],\n",
       " ['5-10k'],\n",
       " ['2-3k'],\n",
       " ['5-8k'],\n",
       " ['6-8k', '13'],\n",
       " ['8-12k'],\n",
       " ['2-3k'],\n",
       " ['4-6k', '13'],\n",
       " ['7-9k'],\n",
       " ['12-20k'],\n",
       " ['15-30k'],\n",
       " ['5-8k'],\n",
       " ['5-9k', '13'],\n",
       " ['8-15k'],\n",
       " ['5-8k'],\n",
       " ['6-9k'],\n",
       " ['10-15k'],\n",
       " ['8-12k'],\n",
       " ['6-12k'],\n",
       " ['5-9k'],\n",
       " ['7-15k'],\n",
       " ['7-12k'],\n",
       " ['5-6k'],\n",
       " ['25-35k', '14'],\n",
       " ['4-8k', '13'],\n",
       " ['7-12k'],\n",
       " ['5-7k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['2-3k'],\n",
       " ['3-5k'],\n",
       " ['2-3k'],\n",
       " ['3-6k'],\n",
       " ['10-15k'],\n",
       " ['8-13k'],\n",
       " ['12-20k'],\n",
       " ['15-20k', '16'],\n",
       " ['10-20k'],\n",
       " ['5-8k'],\n",
       " ['2-3k'],\n",
       " ['8-13k'],\n",
       " ['8-12k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['4-6k'],\n",
       " ['5-9k', '13'],\n",
       " ['7-10k', '13'],\n",
       " ['3-5k'],\n",
       " ['10-12k', '13'],\n",
       " ['5-7k'],\n",
       " ['15-18k'],\n",
       " ['8-16k'],\n",
       " ['3-4k'],\n",
       " ['6-11k', '13'],\n",
       " ['6-7k', '14'],\n",
       " ['3-5k'],\n",
       " ['6-11k'],\n",
       " ['6-8k'],\n",
       " ['4-8k'],\n",
       " ['8-13k', '13'],\n",
       " ['7-10k'],\n",
       " ['4-8k'],\n",
       " ['10-15k'],\n",
       " ['5-7k'],\n",
       " ['5-7k'],\n",
       " ['12-13k'],\n",
       " ['4-6k'],\n",
       " ['8-13k'],\n",
       " ['8-13k'],\n",
       " ['4-8k'],\n",
       " ['6-12k'],\n",
       " ['3-4k'],\n",
       " ['5-10k'],\n",
       " ['4-12k'],\n",
       " ['15-23k'],\n",
       " ['4-6k'],\n",
       " ['6-11k'],\n",
       " ['5-10k'],\n",
       " ['5-7k'],\n",
       " ['5-10k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['4-6k'],\n",
       " ['4-7k'],\n",
       " ['15-40k'],\n",
       " ['7-12k'],\n",
       " ['3-5k'],\n",
       " ['5-8k'],\n",
       " ['7-11k'],\n",
       " ['7-12k'],\n",
       " ['4-6k'],\n",
       " ['6-10k'],\n",
       " ['4-9k'],\n",
       " ['5-9k', '13'],\n",
       " ['5-8k'],\n",
       " ['7-10k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['8-13k'],\n",
       " ['8-13k'],\n",
       " ['5-10k'],\n",
       " ['5-10k'],\n",
       " ['8-13k'],\n",
       " ['3-8k'],\n",
       " ['10-14k'],\n",
       " ['6-8k'],\n",
       " ['6-8k'],\n",
       " ['8-12k'],\n",
       " ['3-4k'],\n",
       " ['4-8k'],\n",
       " ['3-6k'],\n",
       " ['3-5k'],\n",
       " ['7-9k'],\n",
       " ['5-8k'],\n",
       " ['6-10k'],\n",
       " ['5-8k'],\n",
       " ['2-5k'],\n",
       " ['5-10k'],\n",
       " ['4-8k'],\n",
       " ['5-8k'],\n",
       " ['4-8k'],\n",
       " ['5-7k'],\n",
       " ['6-10k'],\n",
       " ['6-8k'],\n",
       " ['4-6k'],\n",
       " ['5-8k'],\n",
       " ['4-7k'],\n",
       " ['6-10k'],\n",
       " ['15-20k'],\n",
       " ['4-9k', '14'],\n",
       " ['5-8k'],\n",
       " ['5-10k'],\n",
       " ['4-8k'],\n",
       " ['5-8k'],\n",
       " ['4-8k'],\n",
       " ['5-6k'],\n",
       " ['6-11k'],\n",
       " ['5-10k'],\n",
       " ['4-8k'],\n",
       " ['10-15k', '13'],\n",
       " ['5-10k'],\n",
       " ['6-10k'],\n",
       " ['8-13k'],\n",
       " ['7-10k'],\n",
       " ['3-4k'],\n",
       " ['5-8k'],\n",
       " ['6-9k'],\n",
       " ['6-9k'],\n",
       " ['3-8k'],\n",
       " ['4-8k'],\n",
       " ['8-10k'],\n",
       " ['8-10k'],\n",
       " ['6-11k'],\n",
       " ['7-10k'],\n",
       " ['8-12k'],\n",
       " ['6-11k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['3-8k'],\n",
       " ['5-8k'],\n",
       " ['2-6k'],\n",
       " ['4-8k'],\n",
       " ['8-10k'],\n",
       " ['4-7k'],\n",
       " ['5-8k'],\n",
       " ['7-12k'],\n",
       " ['3-8k'],\n",
       " ['2-5k'],\n",
       " ['4-6k'],\n",
       " ['3-6k'],\n",
       " ['3-7k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['5-10k'],\n",
       " ['5-8k'],\n",
       " ['5-10k'],\n",
       " ['4-7k'],\n",
       " ['4-7k'],\n",
       " ['4-6k'],\n",
       " ['3-4k'],\n",
       " ['4-6k'],\n",
       " ['8-13k', '13'],\n",
       " ['3-4k'],\n",
       " ['10-15k'],\n",
       " ['5-6k'],\n",
       " ['6-8k', '13'],\n",
       " ['6-12k'],\n",
       " ['15-30k'],\n",
       " ['6-10k'],\n",
       " ['5-7k'],\n",
       " ['8-12k'],\n",
       " ['8-12k'],\n",
       " ['7-10k'],\n",
       " ['6-10k'],\n",
       " ['4-6k'],\n",
       " ['4-6k'],\n",
       " ['6-8k', '13'],\n",
       " ['8-12k'],\n",
       " ['7-12k'],\n",
       " ['5-8k'],\n",
       " ['3-5k'],\n",
       " ['6-8k', '13'],\n",
       " ['5-8k'],\n",
       " ['5-6k'],\n",
       " ['8-15k', '13'],\n",
       " ['8-13k'],\n",
       " ['10-15k', '13'],\n",
       " ['5-10k'],\n",
       " ['4-6k'],\n",
       " ['4-6k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['6-10k'],\n",
       " ['5-8k'],\n",
       " ['30-45k'],\n",
       " ['8-12k'],\n",
       " ['15-25k'],\n",
       " ['9-13k'],\n",
       " ['15-30k'],\n",
       " ['20-30k'],\n",
       " ['12-18k'],\n",
       " ['6-8k'],\n",
       " ['6-10k'],\n",
       " ['8-15k'],\n",
       " ['6-9k'],\n",
       " ['8-13k'],\n",
       " ['10-20k'],\n",
       " ['12-15k'],\n",
       " ['6-8k'],\n",
       " ['6-8k', '13'],\n",
       " ['20-30k'],\n",
       " ['10-15k'],\n",
       " ['8-13k'],\n",
       " ['18-25k'],\n",
       " ['7-12k', '13'],\n",
       " ['18-25k'],\n",
       " ['8-12k'],\n",
       " ['20-30k'],\n",
       " ['25-40k'],\n",
       " ['12-18k', '13'],\n",
       " ['6-13k', '13'],\n",
       " ['7-10k'],\n",
       " ['6-9k'],\n",
       " ['5-7k'],\n",
       " ['15-30k'],\n",
       " ['5-10k'],\n",
       " ['6-11k'],\n",
       " ['10-20k', '13'],\n",
       " ['22-30k', '13'],\n",
       " ['6-9k'],\n",
       " ['7-12k'],\n",
       " ['25-35k'],\n",
       " ['7-10k', '13'],\n",
       " ['5-10k'],\n",
       " ['15-20k'],\n",
       " ['15-20k', '13'],\n",
       " ['15-25k'],\n",
       " ['5-8k'],\n",
       " ['12-20k', '13'],\n",
       " ['8-13k'],\n",
       " ['6-9k'],\n",
       " ['20-25k'],\n",
       " ['12-28k'],\n",
       " ['8-10k'],\n",
       " ['8-15k'],\n",
       " ['5-10k'],\n",
       " ['8-10k'],\n",
       " ['7-12k'],\n",
       " ['6-10k'],\n",
       " ['6-8k', '13'],\n",
       " ['5-8k'],\n",
       " ['5-7k'],\n",
       " ['5-8k'],\n",
       " ['6-10k', '13'],\n",
       " ['6-8k'],\n",
       " ['9-15k'],\n",
       " ['7-10k'],\n",
       " ['6-10k'],\n",
       " ['6-11k'],\n",
       " ['10-15k'],\n",
       " ['4-7k'],\n",
       " ['5-8k'],\n",
       " ['30-50k'],\n",
       " ['15-30k', '14'],\n",
       " ['15-30k'],\n",
       " ['12-23k'],\n",
       " ['8-13k'],\n",
       " ['7-11k'],\n",
       " ['7-10k'],\n",
       " ['11-22k'],\n",
       " ['20-23k'],\n",
       " ['15-20k'],\n",
       " ['6-12k'],\n",
       " ['8-10k'],\n",
       " ['12-18k'],\n",
       " ['6-9k'],\n",
       " ['6-9k'],\n",
       " ['8-10k'],\n",
       " ['20-30k'],\n",
       " ['7-10k'],\n",
       " ['8-13k'],\n",
       " ['10-15k'],\n",
       " ['10-15k'],\n",
       " ['5-9k'],\n",
       " ['4-6k'],\n",
       " ['5-10k', '13'],\n",
       " ['7-10k'],\n",
       " ['7-10k'],\n",
       " ['8-10k', '13'],\n",
       " ['5-8k'],\n",
       " ['18-22k'],\n",
       " ['5-8k'],\n",
       " ['4-6k'],\n",
       " ['7-10k'],\n",
       " ['5-10k', '13'],\n",
       " ['4-9k'],\n",
       " ['4-6k'],\n",
       " ['4-6k'],\n",
       " ['8-10k', '13'],\n",
       " ['4-8k', '13'],\n",
       " ['5-10k'],\n",
       " ['8-10k'],\n",
       " ['6-11k'],\n",
       " ['5-10k', '13'],\n",
       " ['4-6k'],\n",
       " ['8-10k'],\n",
       " ['5-8k'],\n",
       " ['6-18k'],\n",
       " ['6-10k', '14'],\n",
       " ['10-15k'],\n",
       " ['6-9k'],\n",
       " ['8-15k'],\n",
       " ['12-15k'],\n",
       " ['15-30k'],\n",
       " ['10-15k'],\n",
       " ['20-25k'],\n",
       " ['18-25k'],\n",
       " ['15-30k', '13'],\n",
       " ['20-25k', '13'],\n",
       " ['28-35k'],\n",
       " ['10-20k'],\n",
       " ['18-25k'],\n",
       " ['12-17k'],\n",
       " ['15-20k'],\n",
       " ['10-15k'],\n",
       " ['14-20k'],\n",
       " ['6-11k'],\n",
       " ['12-17k'],\n",
       " ['15-20k'],\n",
       " ['15-25k'],\n",
       " ['15-18k', '13'],\n",
       " ['12-16k'],\n",
       " ['15-25k'],\n",
       " ['16-25k', '13'],\n",
       " ['10-20k'],\n",
       " ['12-15k', '13'],\n",
       " ['13-16k'],\n",
       " ['5-8k'],\n",
       " ['7-10k'],\n",
       " ['6-10k'],\n",
       " ['5-8k'],\n",
       " ['6-8k'],\n",
       " ['8-13k'],\n",
       " ['13-14k'],\n",
       " ['5-10k'],\n",
       " ['8-15k'],\n",
       " ['9-13k', '13'],\n",
       " ['6-10k'],\n",
       " ['15-25k'],\n",
       " ['9-15k'],\n",
       " ['5-10k'],\n",
       " ['8-15k'],\n",
       " ['6-10k'],\n",
       " ['7-12k'],\n",
       " ['7-10k'],\n",
       " ['6-7k'],\n",
       " ['5-10k'],\n",
       " ['8-15k'],\n",
       " ['5-8k'],\n",
       " ['12-18k'],\n",
       " ['6-12k'],\n",
       " ['7-10k'],\n",
       " ['5-10k'],\n",
       " ['5-8k'],\n",
       " ['8-10k'],\n",
       " ['11-22k'],\n",
       " ['7-11k', '13'],\n",
       " ['7-10k'],\n",
       " ['4-6k', '13'],\n",
       " ['8-10k'],\n",
       " ['7-12k'],\n",
       " ['8-10k', '13'],\n",
       " ['6-12k'],\n",
       " ['4-6k'],\n",
       " ['4-8k'],\n",
       " ['5-8k'],\n",
       " ['5-8k'],\n",
       " ['8-10k', '13'],\n",
       " ['8-12k'],\n",
       " ['8-12k'],\n",
       " ['12-24k'],\n",
       " ['15-25k'],\n",
       " ['5-8k'],\n",
       " ['15-25k'],\n",
       " ['6-9k'],\n",
       " ['8-16k'],\n",
       " ['8-12k'],\n",
       " ['8-14k'],\n",
       " ['9-10k'],\n",
       " ['7-12k', '13'],\n",
       " ['10-20k'],\n",
       " ['12-17k'],\n",
       " ['10-15k', '13'],\n",
       " ['6-9k'],\n",
       " ['10-15k'],\n",
       " ['7-10k'],\n",
       " ['5-8k'],\n",
       " ['4-8k'],\n",
       " ['12-16k', '13'],\n",
       " ['8-15k', '13'],\n",
       " ['8-12k', '14'],\n",
       " ['15-25k'],\n",
       " ['7-15k', '13'],\n",
       " ['6-12k'],\n",
       " ['4-7k', '13'],\n",
       " ['10-15k'],\n",
       " ['5-8k'],\n",
       " ['7-12k', '13'],\n",
       " ['6-11k'],\n",
       " ['5-12k'],\n",
       " ['8-13k'],\n",
       " ['6-10k'],\n",
       " ['9-14k'],\n",
       " ['8-12k'],\n",
       " ['7-10k'],\n",
       " ['12-15k', '13'],\n",
       " ['10-15k'],\n",
       " ['3-5k'],\n",
       " ['13-18k', '13'],\n",
       " ['16-25k'],\n",
       " ['15-22k', '13'],\n",
       " ['10-15k'],\n",
       " ['20-30k'],\n",
       " ['5-8k', '13'],\n",
       " ['20-30k'],\n",
       " ['20-30k'],\n",
       " ['10-20k'],\n",
       " ['9-14k'],\n",
       " ['6-10k'],\n",
       " ['8-12k'],\n",
       " ['5-8k'],\n",
       " ['8-13k'],\n",
       " ['7-8k'],\n",
       " ['5-8k'],\n",
       " ['4-6k'],\n",
       " ['8-10k'],\n",
       " ['9-12k'],\n",
       " ['5-8k'],\n",
       " ['8-12k'],\n",
       " ['5-8k'],\n",
       " ['9-13k'],\n",
       " ['15-25k'],\n",
       " ['7-12k', '13'],\n",
       " ['7-12k'],\n",
       " ['6-8k'],\n",
       " ['6-10k'],\n",
       " ['5-10k'],\n",
       " ['10-15k'],\n",
       " ['8-15k'],\n",
       " ['6-10k'],\n",
       " ['6-10k', '17'],\n",
       " ['6-8k'],\n",
       " ['20-27k'],\n",
       " ['6-11k'],\n",
       " ['6-9k'],\n",
       " ['15-30k'],\n",
       " ['6-8k'],\n",
       " ['4-6k'],\n",
       " ['8-12k'],\n",
       " ['6-8k'],\n",
       " ['5-8k'],\n",
       " ['10-15k'],\n",
       " ['10-15k'],\n",
       " ['12-13k'],\n",
       " ['15-25k'],\n",
       " ['10-20k', '13'],\n",
       " ['6-8k'],\n",
       " ['7-10k'],\n",
       " ['15-30k'],\n",
       " ['5-8k'],\n",
       " ['11-18k', '13'],\n",
       " ['6-10k'],\n",
       " ['6-10k'],\n",
       " ['9-17k'],\n",
       " ['8-13k'],\n",
       " ['6-10k'],\n",
       " ['8-10k'],\n",
       " ['6-9k'],\n",
       " ['5-8k', '14'],\n",
       " ['11-16k'],\n",
       " ['8-12k'],\n",
       " ['7-10k'],\n",
       " ['10-20k'],\n",
       " ['6-15k'],\n",
       " ['12-17k'],\n",
       " ['6-8k'],\n",
       " ['7-10k'],\n",
       " ['10-20k'],\n",
       " ['6-9k'],\n",
       " ['9-15k', '13'],\n",
       " ['8-13k', '13'],\n",
       " ['20-35k'],\n",
       " ['15-23k', '14'],\n",
       " ['10-15k']]"
      ]
     },
     "execution_count": 196,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "list_非薪资面议 = df_非薪资面议['薪资'].apply(lambda x : x.split('薪')[0].split('·')).values.tolist()\n",
    "list_非薪资面议"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 197,
   "id": "35994ec2",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "735"
      ]
     },
     "execution_count": 197,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Count the parsed salary entries held in list_非薪资面议.\n",
    "len(list_非薪资面议)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 198,
   "id": "d60369ac",
   "metadata": {
    "scrolled": true
   },
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[4.0,\n",
       " 5.5,\n",
       " 6.5,\n",
       " 3.0,\n",
       " 8.5,\n",
       " (7.0, 1.1666666666666667),\n",
       " 4.5,\n",
       " 4.5,\n",
       " 5.5,\n",
       " 5.0,\n",
       " 9.0,\n",
       " 6.5,\n",
       " 11.5,\n",
       " 7.5,\n",
       " 5.0,\n",
       " (22.5, 1.0833333333333333),\n",
       " 5.0,\n",
       " 5.0,\n",
       " 10.5,\n",
       " 7.0,\n",
       " 7.0,\n",
       " (5.0, 1.0833333333333333),\n",
       " (11.0, 1.0833333333333333),\n",
       " 4.5,\n",
       " 6.0,\n",
       " 7.5,\n",
       " (7.5, 1.0833333333333333),\n",
       " 7.5,\n",
       " 7.5,\n",
       " 5.0,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 4.5,\n",
       " 4.0,\n",
       " 4.5,\n",
       " 1.5,\n",
       " 6.0,\n",
       " (12.5, 1.1666666666666667),\n",
       " 7.0,\n",
       " 8.0,\n",
       " 4.0,\n",
       " (9.5, 1.0833333333333333),\n",
       " 5.0,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 3.0,\n",
       " 9.0,\n",
       " 6.5,\n",
       " 7.0,\n",
       " 5.5,\n",
       " (7.5, 1.0833333333333333),\n",
       " 3.0,\n",
       " 9.0,\n",
       " 4.5,\n",
       " (7.0, 1.0833333333333333),\n",
       " 7.5,\n",
       " 10.5,\n",
       " 9.5,\n",
       " (13.0, 1.0833333333333333),\n",
       " 6.5,\n",
       " 6.0,\n",
       " 7.0,\n",
       " 9.0,\n",
       " 5.5,\n",
       " 6.0,\n",
       " 18.5,\n",
       " 10.5,\n",
       " 4.5,\n",
       " 27.0,\n",
       " 6.5,\n",
       " 11.5,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 6.0,\n",
       " 5.0,\n",
       " 1.5,\n",
       " (9.5, 1.0833333333333333),\n",
       " 7.5,\n",
       " 7.5,\n",
       " 6.0,\n",
       " 3.5,\n",
       " 9.5,\n",
       " 5.5,\n",
       " 9.0,\n",
       " 6.0,\n",
       " 6.0,\n",
       " 7.5,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 6.5,\n",
       " 4.0,\n",
       " 4.0,\n",
       " 5.0,\n",
       " 10.5,\n",
       " 8.0,\n",
       " (20.0, 1.0833333333333333),\n",
       " 6.5,\n",
       " 10.0,\n",
       " 6.5,\n",
       " (10.5, 1.0833333333333333),\n",
       " 5.0,\n",
       " 6.5,\n",
       " 10.5,\n",
       " 8.0,\n",
       " 3.0,\n",
       " 7.5,\n",
       " 4.0,\n",
       " 8.0,\n",
       " 5.0,\n",
       " (9.0, 1.0833333333333333),\n",
       " 5.0,\n",
       " 5.0,\n",
       " 4.0,\n",
       " 2.5,\n",
       " 6.5,\n",
       " 10.5,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 5.0,\n",
       " 5.5,\n",
       " 6.5,\n",
       " 10.0,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 7.0,\n",
       " 6.5,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 7.0,\n",
       " (5.0, 1.0833333333333333),\n",
       " 7.5,\n",
       " 2.5,\n",
       " 6.5,\n",
       " 4.5,\n",
       " 2.5,\n",
       " 6.0,\n",
       " 5.5,\n",
       " (5.0, 1.0833333333333333),\n",
       " 6.0,\n",
       " 10.5,\n",
       " 5.0,\n",
       " 7.0,\n",
       " 5.5,\n",
       " 3.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 4.0,\n",
       " 4.0,\n",
       " 4.0,\n",
       " 10.0,\n",
       " 9.0,\n",
       " (6.0, 1.0833333333333333),\n",
       " 5.5,\n",
       " 6.0,\n",
       " 6.0,\n",
       " 6.0,\n",
       " 6.0,\n",
       " 7.5,\n",
       " 8.0,\n",
       " 7.5,\n",
       " 3.5,\n",
       " 3.5,\n",
       " 5.5,\n",
       " 4.5,\n",
       " 1.5,\n",
       " 5.0,\n",
       " 6.0,\n",
       " 10.0,\n",
       " 5.5,\n",
       " 16.5,\n",
       " 7.5,\n",
       " 7.0,\n",
       " 1.5,\n",
       " (7.5, 1.1666666666666667),\n",
       " 4.0,\n",
       " 1.5,\n",
       " 2.5,\n",
       " 6.0,\n",
       " (10.0, 1.1666666666666667),\n",
       " 8.5,\n",
       " 4.5,\n",
       " 9.0,\n",
       " 8.5,\n",
       " 8.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 7.0,\n",
       " 2.0,\n",
       " 6.0,\n",
       " (8.0, 1.0833333333333333),\n",
       " 7.0,\n",
       " 2.0,\n",
       " 4.0,\n",
       " 9.0,\n",
       " (9.0, 1.0833333333333333),\n",
       " (11.0, 1.1666666666666667),\n",
       " (11.0, 1.1666666666666667),\n",
       " 6.0,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 9.0,\n",
       " 16.5,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 4.5,\n",
       " 2.5,\n",
       " 4.0,\n",
       " 2.0,\n",
       " 7.0,\n",
       " (12.5, 1.0833333333333333),\n",
       " 2.5,\n",
       " (7.0, 1.0833333333333333),\n",
       " 2.5,\n",
       " 7.5,\n",
       " 2.5,\n",
       " 6.5,\n",
       " (7.0, 1.0833333333333333),\n",
       " 10.0,\n",
       " 2.5,\n",
       " (5.0, 1.0833333333333333),\n",
       " 8.0,\n",
       " 16.0,\n",
       " 22.5,\n",
       " 6.5,\n",
       " (7.0, 1.0833333333333333),\n",
       " 11.5,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 12.5,\n",
       " 10.0,\n",
       " 9.0,\n",
       " 7.0,\n",
       " 11.0,\n",
       " 9.5,\n",
       " 5.5,\n",
       " (30.0, 1.1666666666666667),\n",
       " (6.0, 1.0833333333333333),\n",
       " 9.5,\n",
       " 6.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 2.5,\n",
       " 4.0,\n",
       " 2.5,\n",
       " 4.5,\n",
       " 12.5,\n",
       " 10.5,\n",
       " 16.0,\n",
       " (17.5, 1.3333333333333333),\n",
       " 15.0,\n",
       " 6.5,\n",
       " 2.5,\n",
       " 10.5,\n",
       " 10.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 5.0,\n",
       " (7.0, 1.0833333333333333),\n",
       " (8.5, 1.0833333333333333),\n",
       " 4.0,\n",
       " (11.0, 1.0833333333333333),\n",
       " 6.0,\n",
       " 16.5,\n",
       " 12.0,\n",
       " 3.5,\n",
       " (8.5, 1.0833333333333333),\n",
       " (6.5, 1.1666666666666667),\n",
       " 4.0,\n",
       " 8.5,\n",
       " 7.0,\n",
       " 6.0,\n",
       " (10.5, 1.0833333333333333),\n",
       " 8.5,\n",
       " 6.0,\n",
       " 12.5,\n",
       " 6.0,\n",
       " 6.0,\n",
       " 12.5,\n",
       " 5.0,\n",
       " 10.5,\n",
       " 10.5,\n",
       " 6.0,\n",
       " 9.0,\n",
       " 3.5,\n",
       " 7.5,\n",
       " 8.0,\n",
       " 19.0,\n",
       " 5.0,\n",
       " 8.5,\n",
       " 7.5,\n",
       " 6.0,\n",
       " 7.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 5.0,\n",
       " 5.5,\n",
       " 27.5,\n",
       " 9.5,\n",
       " 4.0,\n",
       " 6.5,\n",
       " 9.0,\n",
       " 9.5,\n",
       " 5.0,\n",
       " 8.0,\n",
       " 6.5,\n",
       " (7.0, 1.0833333333333333),\n",
       " 6.5,\n",
       " 8.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 10.5,\n",
       " 10.5,\n",
       " 7.5,\n",
       " 7.5,\n",
       " 10.5,\n",
       " 5.5,\n",
       " 12.0,\n",
       " 7.0,\n",
       " 7.0,\n",
       " 10.0,\n",
       " 3.5,\n",
       " 6.0,\n",
       " 4.5,\n",
       " 4.0,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 3.5,\n",
       " 7.5,\n",
       " 6.0,\n",
       " 6.5,\n",
       " 6.0,\n",
       " 6.0,\n",
       " 8.0,\n",
       " 7.0,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 5.5,\n",
       " 8.0,\n",
       " 17.5,\n",
       " (6.5, 1.1666666666666667),\n",
       " 6.5,\n",
       " 7.5,\n",
       " 6.0,\n",
       " 6.5,\n",
       " 6.0,\n",
       " 5.5,\n",
       " 8.5,\n",
       " 7.5,\n",
       " 6.0,\n",
       " (12.5, 1.0833333333333333),\n",
       " 7.5,\n",
       " 8.0,\n",
       " 10.5,\n",
       " 8.5,\n",
       " 3.5,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 7.5,\n",
       " 5.5,\n",
       " 6.0,\n",
       " 9.0,\n",
       " 9.0,\n",
       " 8.5,\n",
       " 8.5,\n",
       " 10.0,\n",
       " 8.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 5.5,\n",
       " 6.5,\n",
       " 4.0,\n",
       " 6.0,\n",
       " 9.0,\n",
       " 5.5,\n",
       " 6.5,\n",
       " 9.5,\n",
       " 5.5,\n",
       " 3.5,\n",
       " 5.0,\n",
       " 4.5,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 5.5,\n",
       " 5.5,\n",
       " 5.0,\n",
       " 3.5,\n",
       " 5.0,\n",
       " (10.5, 1.0833333333333333),\n",
       " 3.5,\n",
       " 12.5,\n",
       " 5.5,\n",
       " (7.0, 1.0833333333333333),\n",
       " 9.0,\n",
       " 22.5,\n",
       " 8.0,\n",
       " 6.0,\n",
       " 10.0,\n",
       " 10.0,\n",
       " 8.5,\n",
       " 8.0,\n",
       " 5.0,\n",
       " 5.0,\n",
       " (7.0, 1.0833333333333333),\n",
       " 10.0,\n",
       " 9.5,\n",
       " 6.5,\n",
       " 4.0,\n",
       " (7.0, 1.0833333333333333),\n",
       " 6.5,\n",
       " 5.5,\n",
       " (11.5, 1.0833333333333333),\n",
       " 10.5,\n",
       " (12.5, 1.0833333333333333),\n",
       " 7.5,\n",
       " 5.0,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 37.5,\n",
       " 10.0,\n",
       " 20.0,\n",
       " 11.0,\n",
       " 22.5,\n",
       " 25.0,\n",
       " 15.0,\n",
       " 7.0,\n",
       " 8.0,\n",
       " 11.5,\n",
       " 7.5,\n",
       " 10.5,\n",
       " 15.0,\n",
       " 13.5,\n",
       " 7.0,\n",
       " (7.0, 1.0833333333333333),\n",
       " 25.0,\n",
       " 12.5,\n",
       " 10.5,\n",
       " 21.5,\n",
       " (9.5, 1.0833333333333333),\n",
       " 21.5,\n",
       " 10.0,\n",
       " 25.0,\n",
       " 32.5,\n",
       " (15.0, 1.0833333333333333),\n",
       " (9.5, 1.0833333333333333),\n",
       " 8.5,\n",
       " 7.5,\n",
       " 6.0,\n",
       " 22.5,\n",
       " 7.5,\n",
       " 8.5,\n",
       " (15.0, 1.0833333333333333),\n",
       " (26.0, 1.0833333333333333),\n",
       " 7.5,\n",
       " 9.5,\n",
       " 30.0,\n",
       " (8.5, 1.0833333333333333),\n",
       " 7.5,\n",
       " 17.5,\n",
       " (17.5, 1.0833333333333333),\n",
       " 20.0,\n",
       " 6.5,\n",
       " (16.0, 1.0833333333333333),\n",
       " 10.5,\n",
       " 7.5,\n",
       " 22.5,\n",
       " 20.0,\n",
       " 9.0,\n",
       " 11.5,\n",
       " 7.5,\n",
       " 9.0,\n",
       " 9.5,\n",
       " 8.0,\n",
       " (7.0, 1.0833333333333333),\n",
       " 6.5,\n",
       " 6.0,\n",
       " 6.5,\n",
       " (8.0, 1.0833333333333333),\n",
       " 7.0,\n",
       " 12.0,\n",
       " 8.5,\n",
       " 8.0,\n",
       " 8.5,\n",
       " 12.5,\n",
       " 5.5,\n",
       " 6.5,\n",
       " 40.0,\n",
       " (22.5, 1.1666666666666667),\n",
       " 22.5,\n",
       " 17.5,\n",
       " 10.5,\n",
       " 9.0,\n",
       " 8.5,\n",
       " 16.5,\n",
       " 21.5,\n",
       " 17.5,\n",
       " 9.0,\n",
       " 9.0,\n",
       " 15.0,\n",
       " 7.5,\n",
       " 7.5,\n",
       " 9.0,\n",
       " 25.0,\n",
       " 8.5,\n",
       " 10.5,\n",
       " 12.5,\n",
       " 12.5,\n",
       " 7.0,\n",
       " 5.0,\n",
       " (7.5, 1.0833333333333333),\n",
       " 8.5,\n",
       " 8.5,\n",
       " (9.0, 1.0833333333333333),\n",
       " 6.5,\n",
       " 20.0,\n",
       " 6.5,\n",
       " 5.0,\n",
       " 8.5,\n",
       " (7.5, 1.0833333333333333),\n",
       " 6.5,\n",
       " 5.0,\n",
       " 5.0,\n",
       " (9.0, 1.0833333333333333),\n",
       " (6.0, 1.0833333333333333),\n",
       " 7.5,\n",
       " 9.0,\n",
       " 8.5,\n",
       " (7.5, 1.0833333333333333),\n",
       " 5.0,\n",
       " 9.0,\n",
       " 6.5,\n",
       " 12.0,\n",
       " (8.0, 1.1666666666666667),\n",
       " 12.5,\n",
       " 7.5,\n",
       " 11.5,\n",
       " 13.5,\n",
       " 22.5,\n",
       " 12.5,\n",
       " 22.5,\n",
       " 21.5,\n",
       " (22.5, 1.0833333333333333),\n",
       " (22.5, 1.0833333333333333),\n",
       " 31.5,\n",
       " 15.0,\n",
       " 21.5,\n",
       " 14.5,\n",
       " 17.5,\n",
       " 12.5,\n",
       " 17.0,\n",
       " 8.5,\n",
       " 14.5,\n",
       " 17.5,\n",
       " 20.0,\n",
       " (16.5, 1.0833333333333333),\n",
       " 14.0,\n",
       " 20.0,\n",
       " (20.5, 1.0833333333333333),\n",
       " 15.0,\n",
       " (13.5, 1.0833333333333333),\n",
       " 14.5,\n",
       " 6.5,\n",
       " 8.5,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 7.0,\n",
       " 10.5,\n",
       " 13.5,\n",
       " 7.5,\n",
       " 11.5,\n",
       " (11.0, 1.0833333333333333),\n",
       " 8.0,\n",
       " 20.0,\n",
       " 12.0,\n",
       " 7.5,\n",
       " 11.5,\n",
       " 8.0,\n",
       " 9.5,\n",
       " 8.5,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 11.5,\n",
       " 6.5,\n",
       " 15.0,\n",
       " 9.0,\n",
       " 8.5,\n",
       " 7.5,\n",
       " 6.5,\n",
       " 9.0,\n",
       " 16.5,\n",
       " (9.0, 1.0833333333333333),\n",
       " 8.5,\n",
       " (5.0, 1.0833333333333333),\n",
       " 9.0,\n",
       " 9.5,\n",
       " (9.0, 1.0833333333333333),\n",
       " 9.0,\n",
       " 5.0,\n",
       " 6.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " (9.0, 1.0833333333333333),\n",
       " 10.0,\n",
       " 10.0,\n",
       " 18.0,\n",
       " 20.0,\n",
       " 6.5,\n",
       " 20.0,\n",
       " 7.5,\n",
       " 12.0,\n",
       " 10.0,\n",
       " 11.0,\n",
       " 9.5,\n",
       " (9.5, 1.0833333333333333),\n",
       " 15.0,\n",
       " 14.5,\n",
       " (12.5, 1.0833333333333333),\n",
       " 7.5,\n",
       " 12.5,\n",
       " 8.5,\n",
       " 6.5,\n",
       " 6.0,\n",
       " (14.0, 1.0833333333333333),\n",
       " (11.5, 1.0833333333333333),\n",
       " (10.0, 1.1666666666666667),\n",
       " 20.0,\n",
       " (11.0, 1.0833333333333333),\n",
       " 9.0,\n",
       " (5.5, 1.0833333333333333),\n",
       " 12.5,\n",
       " 6.5,\n",
       " (9.5, 1.0833333333333333),\n",
       " 8.5,\n",
       " 8.5,\n",
       " 10.5,\n",
       " 8.0,\n",
       " 11.5,\n",
       " 10.0,\n",
       " 8.5,\n",
       " (13.5, 1.0833333333333333),\n",
       " 12.5,\n",
       " 4.0,\n",
       " (15.5, 1.0833333333333333),\n",
       " 20.5,\n",
       " (18.5, 1.0833333333333333),\n",
       " 12.5,\n",
       " 25.0,\n",
       " (6.5, 1.0833333333333333),\n",
       " 25.0,\n",
       " 25.0,\n",
       " 15.0,\n",
       " 11.5,\n",
       " 8.0,\n",
       " 10.0,\n",
       " 6.5,\n",
       " 10.5,\n",
       " 7.5,\n",
       " 6.5,\n",
       " 5.0,\n",
       " 9.0,\n",
       " 10.5,\n",
       " 6.5,\n",
       " 10.0,\n",
       " 6.5,\n",
       " 11.0,\n",
       " 20.0,\n",
       " (9.5, 1.0833333333333333),\n",
       " 9.5,\n",
       " 7.0,\n",
       " 8.0,\n",
       " 7.5,\n",
       " 12.5,\n",
       " 11.5,\n",
       " 8.0,\n",
       " (8.0, 1.4166666666666667),\n",
       " 7.0,\n",
       " 23.5,\n",
       " 8.5,\n",
       " 7.5,\n",
       " 22.5,\n",
       " 7.0,\n",
       " 5.0,\n",
       " 10.0,\n",
       " 7.0,\n",
       " 6.5,\n",
       " 12.5,\n",
       " 12.5,\n",
       " 12.5,\n",
       " 20.0,\n",
       " (15.0, 1.0833333333333333),\n",
       " 7.0,\n",
       " 8.5,\n",
       " 22.5,\n",
       " 6.5,\n",
       " (14.5, 1.0833333333333333),\n",
       " 8.0,\n",
       " 8.0,\n",
       " 13.0,\n",
       " 10.5,\n",
       " 8.0,\n",
       " 9.0,\n",
       " 7.5,\n",
       " (6.5, 1.1666666666666667),\n",
       " 13.5,\n",
       " 10.0,\n",
       " 8.5,\n",
       " 15.0,\n",
       " 10.5,\n",
       " 14.5,\n",
       " 7.0,\n",
       " 8.5,\n",
       " 15.0,\n",
       " 7.5,\n",
       " (12.0, 1.0833333333333333),\n",
       " (10.5, 1.0833333333333333),\n",
       " 27.5,\n",
       " (19.0, 1.1666666666666667),\n",
       " 12.5]"
      ]
     },
     "execution_count": 198,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "[(int(i[0][:-1].split('-')[0]) + int(i[0][:-1].split('-')[1])) / 2  if len(i) == 1 else ((int(i[0][:-1].split('-')[0]) + int(i[0][:-1].split('-')[1])) / 2, int(i[1]) / 12) for i in list_非薪资面议]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 199,
   "id": "858aa802",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[4.0,\n",
       " 5.5,\n",
       " 6.5,\n",
       " 3.0,\n",
       " 8.5,\n",
       " 8.2,\n",
       " 4.5,\n",
       " 4.5,\n",
       " 5.5,\n",
       " 5.0,\n",
       " 9.0,\n",
       " 6.5,\n",
       " 11.5,\n",
       " 7.5,\n",
       " 5.0,\n",
       " 24.4,\n",
       " 5.0,\n",
       " 5.0,\n",
       " 10.5,\n",
       " 7.0,\n",
       " 7.0,\n",
       " 5.4,\n",
       " 11.9,\n",
       " 4.5,\n",
       " 6.0,\n",
       " 7.5,\n",
       " 8.1,\n",
       " 7.5,\n",
       " 7.5,\n",
       " 5.0,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 4.5,\n",
       " 4.0,\n",
       " 4.5,\n",
       " 1.5,\n",
       " 6.0,\n",
       " 14.6,\n",
       " 7.0,\n",
       " 8.0,\n",
       " 4.0,\n",
       " 10.3,\n",
       " 5.0,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 3.0,\n",
       " 9.0,\n",
       " 6.5,\n",
       " 7.0,\n",
       " 5.5,\n",
       " 8.1,\n",
       " 3.0,\n",
       " 9.0,\n",
       " 4.5,\n",
       " 7.6,\n",
       " 7.5,\n",
       " 10.5,\n",
       " 9.5,\n",
       " 14.1,\n",
       " 6.5,\n",
       " 6.0,\n",
       " 7.0,\n",
       " 9.0,\n",
       " 5.5,\n",
       " 6.0,\n",
       " 18.5,\n",
       " 10.5,\n",
       " 4.5,\n",
       " 27.0,\n",
       " 6.5,\n",
       " 11.5,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 6.0,\n",
       " 5.0,\n",
       " 1.5,\n",
       " 10.3,\n",
       " 7.5,\n",
       " 7.5,\n",
       " 6.0,\n",
       " 3.5,\n",
       " 9.5,\n",
       " 5.5,\n",
       " 9.0,\n",
       " 6.0,\n",
       " 6.0,\n",
       " 7.5,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 6.5,\n",
       " 4.0,\n",
       " 4.0,\n",
       " 5.0,\n",
       " 10.5,\n",
       " 8.0,\n",
       " 21.7,\n",
       " 6.5,\n",
       " 10.0,\n",
       " 6.5,\n",
       " 11.4,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 10.5,\n",
       " 8.0,\n",
       " 3.0,\n",
       " 7.5,\n",
       " 4.0,\n",
       " 8.0,\n",
       " 5.0,\n",
       " 9.8,\n",
       " 5.0,\n",
       " 5.0,\n",
       " 4.0,\n",
       " 2.5,\n",
       " 6.5,\n",
       " 10.5,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 5.0,\n",
       " 5.5,\n",
       " 6.5,\n",
       " 10.0,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 7.0,\n",
       " 6.5,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 7.0,\n",
       " 5.4,\n",
       " 7.5,\n",
       " 2.5,\n",
       " 6.5,\n",
       " 4.5,\n",
       " 2.5,\n",
       " 6.0,\n",
       " 5.5,\n",
       " 5.4,\n",
       " 6.0,\n",
       " 10.5,\n",
       " 5.0,\n",
       " 7.0,\n",
       " 5.5,\n",
       " 3.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 4.0,\n",
       " 4.0,\n",
       " 4.0,\n",
       " 10.0,\n",
       " 9.0,\n",
       " 6.5,\n",
       " 5.5,\n",
       " 6.0,\n",
       " 6.0,\n",
       " 6.0,\n",
       " 6.0,\n",
       " 7.5,\n",
       " 8.0,\n",
       " 7.5,\n",
       " 3.5,\n",
       " 3.5,\n",
       " 5.5,\n",
       " 4.5,\n",
       " 1.5,\n",
       " 5.0,\n",
       " 6.0,\n",
       " 10.0,\n",
       " 5.5,\n",
       " 16.5,\n",
       " 7.5,\n",
       " 7.0,\n",
       " 1.5,\n",
       " 8.8,\n",
       " 4.0,\n",
       " 1.5,\n",
       " 2.5,\n",
       " 6.0,\n",
       " 11.7,\n",
       " 8.5,\n",
       " 4.5,\n",
       " 9.0,\n",
       " 8.5,\n",
       " 8.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 7.0,\n",
       " 2.0,\n",
       " 6.0,\n",
       " 8.7,\n",
       " 7.0,\n",
       " 2.0,\n",
       " 4.0,\n",
       " 9.0,\n",
       " 9.8,\n",
       " 12.8,\n",
       " 12.8,\n",
       " 6.0,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 9.0,\n",
       " 16.5,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 4.5,\n",
       " 2.5,\n",
       " 4.0,\n",
       " 2.0,\n",
       " 7.0,\n",
       " 13.5,\n",
       " 2.5,\n",
       " 7.6,\n",
       " 2.5,\n",
       " 7.5,\n",
       " 2.5,\n",
       " 6.5,\n",
       " 7.6,\n",
       " 10.0,\n",
       " 2.5,\n",
       " 5.4,\n",
       " 8.0,\n",
       " 16.0,\n",
       " 22.5,\n",
       " 6.5,\n",
       " 7.6,\n",
       " 11.5,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 12.5,\n",
       " 10.0,\n",
       " 9.0,\n",
       " 7.0,\n",
       " 11.0,\n",
       " 9.5,\n",
       " 5.5,\n",
       " 35.0,\n",
       " 6.5,\n",
       " 9.5,\n",
       " 6.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 2.5,\n",
       " 4.0,\n",
       " 2.5,\n",
       " 4.5,\n",
       " 12.5,\n",
       " 10.5,\n",
       " 16.0,\n",
       " 23.3,\n",
       " 15.0,\n",
       " 6.5,\n",
       " 2.5,\n",
       " 10.5,\n",
       " 10.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 5.0,\n",
       " 7.6,\n",
       " 9.2,\n",
       " 4.0,\n",
       " 11.9,\n",
       " 6.0,\n",
       " 16.5,\n",
       " 12.0,\n",
       " 3.5,\n",
       " 9.2,\n",
       " 7.6,\n",
       " 4.0,\n",
       " 8.5,\n",
       " 7.0,\n",
       " 6.0,\n",
       " 11.4,\n",
       " 8.5,\n",
       " 6.0,\n",
       " 12.5,\n",
       " 6.0,\n",
       " 6.0,\n",
       " 12.5,\n",
       " 5.0,\n",
       " 10.5,\n",
       " 10.5,\n",
       " 6.0,\n",
       " 9.0,\n",
       " 3.5,\n",
       " 7.5,\n",
       " 8.0,\n",
       " 19.0,\n",
       " 5.0,\n",
       " 8.5,\n",
       " 7.5,\n",
       " 6.0,\n",
       " 7.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 5.0,\n",
       " 5.5,\n",
       " 27.5,\n",
       " 9.5,\n",
       " 4.0,\n",
       " 6.5,\n",
       " 9.0,\n",
       " 9.5,\n",
       " 5.0,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 7.6,\n",
       " 6.5,\n",
       " 8.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 10.5,\n",
       " 10.5,\n",
       " 7.5,\n",
       " 7.5,\n",
       " 10.5,\n",
       " 5.5,\n",
       " 12.0,\n",
       " 7.0,\n",
       " 7.0,\n",
       " 10.0,\n",
       " 3.5,\n",
       " 6.0,\n",
       " 4.5,\n",
       " 4.0,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 3.5,\n",
       " 7.5,\n",
       " 6.0,\n",
       " 6.5,\n",
       " 6.0,\n",
       " 6.0,\n",
       " 8.0,\n",
       " 7.0,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 5.5,\n",
       " 8.0,\n",
       " 17.5,\n",
       " 7.6,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 6.0,\n",
       " 6.5,\n",
       " 6.0,\n",
       " 5.5,\n",
       " 8.5,\n",
       " 7.5,\n",
       " 6.0,\n",
       " 13.5,\n",
       " 7.5,\n",
       " 8.0,\n",
       " 10.5,\n",
       " 8.5,\n",
       " 3.5,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 7.5,\n",
       " 5.5,\n",
       " 6.0,\n",
       " 9.0,\n",
       " 9.0,\n",
       " 8.5,\n",
       " 8.5,\n",
       " 10.0,\n",
       " 8.5,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 5.5,\n",
       " 6.5,\n",
       " 4.0,\n",
       " 6.0,\n",
       " 9.0,\n",
       " 5.5,\n",
       " 6.5,\n",
       " 9.5,\n",
       " 5.5,\n",
       " 3.5,\n",
       " 5.0,\n",
       " 4.5,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 5.5,\n",
       " 5.5,\n",
       " 5.0,\n",
       " 3.5,\n",
       " 5.0,\n",
       " 11.4,\n",
       " 3.5,\n",
       " 12.5,\n",
       " 5.5,\n",
       " 7.6,\n",
       " 9.0,\n",
       " 22.5,\n",
       " 8.0,\n",
       " 6.0,\n",
       " 10.0,\n",
       " 10.0,\n",
       " 8.5,\n",
       " 8.0,\n",
       " 5.0,\n",
       " 5.0,\n",
       " 7.6,\n",
       " 10.0,\n",
       " 9.5,\n",
       " 6.5,\n",
       " 4.0,\n",
       " 7.6,\n",
       " 6.5,\n",
       " 5.5,\n",
       " 12.5,\n",
       " 10.5,\n",
       " 13.5,\n",
       " 7.5,\n",
       " 5.0,\n",
       " 5.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 37.5,\n",
       " 10.0,\n",
       " 20.0,\n",
       " 11.0,\n",
       " 22.5,\n",
       " 25.0,\n",
       " 15.0,\n",
       " 7.0,\n",
       " 8.0,\n",
       " 11.5,\n",
       " 7.5,\n",
       " 10.5,\n",
       " 15.0,\n",
       " 13.5,\n",
       " 7.0,\n",
       " 7.6,\n",
       " 25.0,\n",
       " 12.5,\n",
       " 10.5,\n",
       " 21.5,\n",
       " 10.3,\n",
       " 21.5,\n",
       " 10.0,\n",
       " 25.0,\n",
       " 32.5,\n",
       " 16.2,\n",
       " 10.3,\n",
       " 8.5,\n",
       " 7.5,\n",
       " 6.0,\n",
       " 22.5,\n",
       " 7.5,\n",
       " 8.5,\n",
       " 16.2,\n",
       " 28.2,\n",
       " 7.5,\n",
       " 9.5,\n",
       " 30.0,\n",
       " 9.2,\n",
       " 7.5,\n",
       " 17.5,\n",
       " 19.0,\n",
       " 20.0,\n",
       " 6.5,\n",
       " 17.3,\n",
       " 10.5,\n",
       " 7.5,\n",
       " 22.5,\n",
       " 20.0,\n",
       " 9.0,\n",
       " 11.5,\n",
       " 7.5,\n",
       " 9.0,\n",
       " 9.5,\n",
       " 8.0,\n",
       " 7.6,\n",
       " 6.5,\n",
       " 6.0,\n",
       " 6.5,\n",
       " 8.7,\n",
       " 7.0,\n",
       " 12.0,\n",
       " 8.5,\n",
       " 8.0,\n",
       " 8.5,\n",
       " 12.5,\n",
       " 5.5,\n",
       " 6.5,\n",
       " 40.0,\n",
       " 26.2,\n",
       " 22.5,\n",
       " 17.5,\n",
       " 10.5,\n",
       " 9.0,\n",
       " 8.5,\n",
       " 16.5,\n",
       " 21.5,\n",
       " 17.5,\n",
       " 9.0,\n",
       " 9.0,\n",
       " 15.0,\n",
       " 7.5,\n",
       " 7.5,\n",
       " 9.0,\n",
       " 25.0,\n",
       " 8.5,\n",
       " 10.5,\n",
       " 12.5,\n",
       " 12.5,\n",
       " 7.0,\n",
       " 5.0,\n",
       " 8.1,\n",
       " 8.5,\n",
       " 8.5,\n",
       " 9.8,\n",
       " 6.5,\n",
       " 20.0,\n",
       " 6.5,\n",
       " 5.0,\n",
       " 8.5,\n",
       " 8.1,\n",
       " 6.5,\n",
       " 5.0,\n",
       " 5.0,\n",
       " 9.8,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 9.0,\n",
       " 8.5,\n",
       " 8.1,\n",
       " 5.0,\n",
       " 9.0,\n",
       " 6.5,\n",
       " 12.0,\n",
       " 9.3,\n",
       " 12.5,\n",
       " 7.5,\n",
       " 11.5,\n",
       " 13.5,\n",
       " 22.5,\n",
       " 12.5,\n",
       " 22.5,\n",
       " 21.5,\n",
       " 24.4,\n",
       " 24.4,\n",
       " 31.5,\n",
       " 15.0,\n",
       " 21.5,\n",
       " 14.5,\n",
       " 17.5,\n",
       " 12.5,\n",
       " 17.0,\n",
       " 8.5,\n",
       " 14.5,\n",
       " 17.5,\n",
       " 20.0,\n",
       " 17.9,\n",
       " 14.0,\n",
       " 20.0,\n",
       " 22.2,\n",
       " 15.0,\n",
       " 14.6,\n",
       " 14.5,\n",
       " 6.5,\n",
       " 8.5,\n",
       " 8.0,\n",
       " 6.5,\n",
       " 7.0,\n",
       " 10.5,\n",
       " 13.5,\n",
       " 7.5,\n",
       " 11.5,\n",
       " 11.9,\n",
       " 8.0,\n",
       " 20.0,\n",
       " 12.0,\n",
       " 7.5,\n",
       " 11.5,\n",
       " 8.0,\n",
       " 9.5,\n",
       " 8.5,\n",
       " 6.5,\n",
       " 7.5,\n",
       " 11.5,\n",
       " 6.5,\n",
       " 15.0,\n",
       " 9.0,\n",
       " 8.5,\n",
       " 7.5,\n",
       " 6.5,\n",
       " 9.0,\n",
       " 16.5,\n",
       " 9.8,\n",
       " 8.5,\n",
       " 5.4,\n",
       " 9.0,\n",
       " 9.5,\n",
       " 9.8,\n",
       " 9.0,\n",
       " 5.0,\n",
       " 6.0,\n",
       " 6.5,\n",
       " 6.5,\n",
       " 9.8,\n",
       " 10.0,\n",
       " 10.0,\n",
       " 18.0,\n",
       " 20.0,\n",
       " 6.5,\n",
       " 20.0,\n",
       " 7.5,\n",
       " 12.0,\n",
       " 10.0,\n",
       " 11.0,\n",
       " 9.5,\n",
       " 10.3,\n",
       " 15.0,\n",
       " 14.5,\n",
       " 13.5,\n",
       " 7.5,\n",
       " 12.5,\n",
       " 8.5,\n",
       " 6.5,\n",
       " 6.0,\n",
       " 15.2,\n",
       " 12.5,\n",
       " 11.7,\n",
       " 20.0,\n",
       " 11.9,\n",
       " 9.0,\n",
       " 6.0,\n",
       " 12.5,\n",
       " 6.5,\n",
       " 10.3,\n",
       " 8.5,\n",
       " 8.5,\n",
       " 10.5,\n",
       " 8.0,\n",
       " 11.5,\n",
       " 10.0,\n",
       " 8.5,\n",
       " 14.6,\n",
       " 12.5,\n",
       " 4.0,\n",
       " 16.8,\n",
       " 20.5,\n",
       " 20.0,\n",
       " 12.5,\n",
       " 25.0,\n",
       " 7.0,\n",
       " 25.0,\n",
       " 25.0,\n",
       " 15.0,\n",
       " 11.5,\n",
       " 8.0,\n",
       " 10.0,\n",
       " 6.5,\n",
       " 10.5,\n",
       " 7.5,\n",
       " 6.5,\n",
       " 5.0,\n",
       " 9.0,\n",
       " 10.5,\n",
       " 6.5,\n",
       " 10.0,\n",
       " 6.5,\n",
       " 11.0,\n",
       " 20.0,\n",
       " 10.3,\n",
       " 9.5,\n",
       " 7.0,\n",
       " 8.0,\n",
       " 7.5,\n",
       " 12.5,\n",
       " 11.5,\n",
       " 8.0,\n",
       " 11.3,\n",
       " 7.0,\n",
       " 23.5,\n",
       " 8.5,\n",
       " 7.5,\n",
       " 22.5,\n",
       " 7.0,\n",
       " 5.0,\n",
       " 10.0,\n",
       " 7.0,\n",
       " 6.5,\n",
       " 12.5,\n",
       " 12.5,\n",
       " 12.5,\n",
       " 20.0,\n",
       " 16.2,\n",
       " 7.0,\n",
       " 8.5,\n",
       " 22.5,\n",
       " 6.5,\n",
       " 15.7,\n",
       " 8.0,\n",
       " 8.0,\n",
       " 13.0,\n",
       " 10.5,\n",
       " 8.0,\n",
       " 9.0,\n",
       " 7.5,\n",
       " 7.6,\n",
       " 13.5,\n",
       " 10.0,\n",
       " 8.5,\n",
       " 15.0,\n",
       " 10.5,\n",
       " 14.5,\n",
       " 7.0,\n",
       " 8.5,\n",
       " 15.0,\n",
       " 7.5,\n",
       " 13.0,\n",
       " 11.4,\n",
       " 27.5,\n",
       " 22.2,\n",
       " 12.5]"
      ]
     },
     "execution_count": 199,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "平均薪资 = [(int(i[0][:-1].split('-')[0]) + int(i[0][:-1].split('-')[1])) / 2  if len(i) == 1 else round((int(i[0][:-1].split('-')[0]) + int(i[0][:-1].split('-')[1])) / 2 * int(i[1]) / 12, 1) for i in list_非薪资面议]\n",
    "平均薪资"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 200,
   "id": "fa79432a",
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-200-26b58d6be08b>:1: SettingWithCopyWarning: \n",
      "A value is trying to be set on a copy of a slice from a DataFrame.\n",
      "Try using .loc[row_indexer,col_indexer] = value instead\n",
      "\n",
      "See the caveats in the documentation: https://pandas.pydata.org/pandas-docs/stable/user_guide/indexing.html#returning-a-view-versus-a-copy\n",
      "  df_非薪资面议['平均薪资'] = 平均薪资\n"
     ]
    },
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>职位</th>\n",
       "      <th>薪资</th>\n",
       "      <th>地区</th>\n",
       "      <th>公司</th>\n",
       "      <th>公司规模</th>\n",
       "      <th>职业标签</th>\n",
       "      <th>学历</th>\n",
       "      <th>行业</th>\n",
       "      <th>平均薪资</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>3-5k</td>\n",
       "      <td>广州</td>\n",
       "      <td>广州市拓植文化传播有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>批发/零售</td>\n",
       "      <td>4.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>4-7k</td>\n",
       "      <td>广州</td>\n",
       "      <td>慢会所</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '新媒体运营']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>家政服务</td>\n",
       "      <td>5.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>新媒体运营实习生</td>\n",
       "      <td>5-8k</td>\n",
       "      <td>广州-番禺区</td>\n",
       "      <td>广州市学晟惠信息科技有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...</td>\n",
       "      <td>NaN</td>\n",
       "      <td>互联网</td>\n",
       "      <td>6.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>2-4k</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>广州花林知行研学旅行服务有限公司</td>\n",
       "      <td>1-49人</td>\n",
       "      <td>['大专']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>其他商务服务业</td>\n",
       "      <td>3.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>新媒体运营（应届生或实习生）</td>\n",
       "      <td>7-10k</td>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>蜂助手股份有限公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['本科']</td>\n",
       "      <td>NaN</td>\n",
       "      <td>生活服务O2O</td>\n",
       "      <td>8.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>新媒体运营（有丛气）</td>\n",
       "      <td>9-15k·13薪</td>\n",
       "      <td>广州-荔湾区</td>\n",
       "      <td>立白集团</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']</td>\n",
       "      <td>大专</td>\n",
       "      <td>日化</td>\n",
       "      <td>13.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>新媒体运营专员</td>\n",
       "      <td>8-13k·13薪</td>\n",
       "      <td>广州</td>\n",
       "      <td>某知名公司</td>\n",
       "      <td>NaN</td>\n",
       "      <td>['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...</td>\n",
       "      <td>大专及以上</td>\n",
       "      <td>房地产开发经营</td>\n",
       "      <td>11.4</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>新媒体运营岗</td>\n",
       "      <td>20-35k</td>\n",
       "      <td>广州-白云区</td>\n",
       "      <td>某广州大型货运/物流/仓储公司</td>\n",
       "      <td>10000人以上</td>\n",
       "      <td>['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>货运/物流/仓储</td>\n",
       "      <td>27.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>新媒体运营</td>\n",
       "      <td>15-23k·14薪</td>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>某国内智能硬件公司</td>\n",
       "      <td>50-99人</td>\n",
       "      <td>['新媒体运营', '活动运营', '线上运营', '抖音平台']</td>\n",
       "      <td>统招本科</td>\n",
       "      <td>智能硬件</td>\n",
       "      <td>22.2</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>新媒体运营（公众号、Facebook、titok）</td>\n",
       "      <td>10-15k</td>\n",
       "      <td>广州</td>\n",
       "      <td>某广州计算机软件公司</td>\n",
       "      <td>100-499人</td>\n",
       "      <td>['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']</td>\n",
       "      <td>本科及以上</td>\n",
       "      <td>计算机软件</td>\n",
       "      <td>12.5</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>735 rows × 9 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                            职位          薪资      地区                公司  \\\n",
       "0                     新媒体运营实习生        3-5k      广州     广州市拓植文化传播有限公司   \n",
       "1                     新媒体运营实习生        4-7k      广州               慢会所   \n",
       "2                     新媒体运营实习生        5-8k  广州-番禺区    广州市学晟惠信息科技有限公司   \n",
       "3                        新媒体运营        2-4k  广州-海珠区  广州花林知行研学旅行服务有限公司   \n",
       "4               新媒体运营（应届生或实习生）       7-10k  广州-天河区         蜂助手股份有限公司   \n",
       "..                         ...         ...     ...               ...   \n",
       "795                 新媒体运营（有丛气）   9-15k·13薪  广州-荔湾区              立白集团   \n",
       "796                    新媒体运营专员   8-13k·13薪      广州             某知名公司   \n",
       "797                     新媒体运营岗      20-35k  广州-白云区   某广州大型货运/物流/仓储公司   \n",
       "798                      新媒体运营  15-23k·14薪  广州-海珠区         某国内智能硬件公司   \n",
       "799  新媒体运营（公众号、Facebook、titok）      10-15k      广州        某广州计算机软件公司   \n",
       "\n",
       "         公司规模                                               职业标签     学历  \\\n",
       "0       1-49人  ['大专', '新媒体运营', '微信公众号', '新媒体平台', '微博平台', '快手平...    NaN   \n",
       "1       1-49人                                    ['本科', '新媒体运营']    NaN   \n",
       "2       1-49人  ['本科', '微信公众号', '新媒体运营', '社群运营', '新闻类', '生活类',...    NaN   \n",
       "3       1-49人                                             ['大专']    NaN   \n",
       "4    100-499人                                             ['本科']    NaN   \n",
       "..        ...                                                ...    ...   \n",
       "795  10000人以上                ['自媒体运营', '新媒体运营', '自媒体平台', '抖音平台']     大专   \n",
       "796       NaN  ['内容运营', '新媒体运营', '短视频运营', '粉丝运营', '服装/纺织/皮革',...  大专及以上   \n",
       "797  10000人以上  ['新媒体运营', '小红书平台', '短视频运营', 'to C', '线上运营', '抖...   统招本科   \n",
       "798    50-99人                  ['新媒体运营', '活动运营', '线上运营', '抖音平台']   统招本科   \n",
       "799  100-499人     ['新媒体平台', '微信公众号', '英语', '线上运营', 'Facebook平台']  本科及以上   \n",
       "\n",
       "           行业  平均薪资  \n",
       "0       批发/零售   4.0  \n",
       "1        家政服务   5.5  \n",
       "2         互联网   6.5  \n",
       "3     其他商务服务业   3.0  \n",
       "4     生活服务O2O   8.5  \n",
       "..        ...   ...  \n",
       "795        日化  13.0  \n",
       "796   房地产开发经营  11.4  \n",
       "797  货运/物流/仓储  27.5  \n",
       "798      智能硬件  22.2  \n",
       "799     计算机软件  12.5  \n",
       "\n",
       "[735 rows x 9 columns]"
      ]
     },
     "execution_count": 200,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_非薪资面议['平均薪资'] = 平均薪资\n",
    "df_非薪资面议"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 201,
   "id": "6630798b",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>平均薪资</th>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>地区</th>\n",
       "      <th></th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>广州</th>\n",
       "      <td>7.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州-从化区</th>\n",
       "      <td>5.25</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州-南沙区</th>\n",
       "      <td>7.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州-增城区</th>\n",
       "      <td>7.60</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州-天河区</th>\n",
       "      <td>8.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州-海珠区</th>\n",
       "      <td>7.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州-番禺区</th>\n",
       "      <td>7.80</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州-白云区</th>\n",
       "      <td>8.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州-花都区</th>\n",
       "      <td>6.75</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州-荔湾区</th>\n",
       "      <td>7.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州-越秀区</th>\n",
       "      <td>8.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>广州-黄埔区</th>\n",
       "      <td>9.50</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "        平均薪资\n",
       "地区          \n",
       "广州      7.50\n",
       "广州-从化区  5.25\n",
       "广州-南沙区  7.50\n",
       "广州-增城区  7.60\n",
       "广州-天河区  8.00\n",
       "广州-海珠区  7.50\n",
       "广州-番禺区  7.80\n",
       "广州-白云区  8.50\n",
       "广州-花都区  6.75\n",
       "广州-荔湾区  7.50\n",
       "广州-越秀区  8.50\n",
       "广州-黄埔区  9.50"
      ]
     },
     "execution_count": 201,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 分地区看产品经理岗位中位数\n",
    "df_非薪资面议.groupby('地区').agg({'平均薪资': 'median'})"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 202,
   "id": "f8c49427",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>地区</th>\n",
       "      <th>平均薪资</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>广州-从化区</td>\n",
       "      <td>5.25</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>广州-花都区</td>\n",
       "      <td>6.75</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>广州-南沙区</td>\n",
       "      <td>7.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>7.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>广州-荔湾区</td>\n",
       "      <td>7.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>广州-增城区</td>\n",
       "      <td>7.60</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>广州-番禺区</td>\n",
       "      <td>7.80</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>8.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>广州-白云区</td>\n",
       "      <td>8.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>广州-越秀区</td>\n",
       "      <td>8.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>广州-黄埔区</td>\n",
       "      <td>9.50</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "        地区  平均薪资\n",
       "1   广州-从化区  5.25\n",
       "8   广州-花都区  6.75\n",
       "2   广州-南沙区  7.50\n",
       "5   广州-海珠区  7.50\n",
       "9   广州-荔湾区  7.50\n",
       "3   广州-增城区  7.60\n",
       "6   广州-番禺区  7.80\n",
       "4   广州-天河区  8.00\n",
       "7   广州-白云区  8.50\n",
       "10  广州-越秀区  8.50\n",
       "11  广州-黄埔区  9.50"
      ]
     },
     "execution_count": 202,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 地区\n",
    "非薪资面议_地区 = df_非薪资面议.groupby('地区').agg({'平均薪资': 'median'}).reset_index().query('地区!=\"广州\"').sort_values('平均薪资')\n",
    "非薪资面议_地区"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 203,
   "id": "04f393ac",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>学历</th>\n",
       "      <th>平均薪资</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>中专/中技</td>\n",
       "      <td>6.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>大专</td>\n",
       "      <td>7.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>学历不限</td>\n",
       "      <td>7.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>本科</td>\n",
       "      <td>8.10</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>初中</td>\n",
       "      <td>10.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>硕士</td>\n",
       "      <td>10.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>11.90</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>12.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>本科及以上</td>\n",
       "      <td>16.25</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "      学历   平均薪资\n",
       "0  中专/中技   6.50\n",
       "2     大专   7.50\n",
       "4   学历不限   7.50\n",
       "5     本科   8.10\n",
       "1     初中  10.00\n",
       "7     硕士  10.50\n",
       "8   统招本科  11.90\n",
       "3  大专及以上  12.50\n",
       "6  本科及以上  16.25"
      ]
     },
     "execution_count": 203,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 学历\n",
    "非薪资面议_学历 = df_非薪资面议.groupby('学历').agg({'平均薪资': 'median'}).reset_index().sort_values('平均薪资')\n",
    "非薪资面议_学历"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 204,
   "id": "add00dae",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>行业</th>\n",
       "      <th>平均薪资</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>63</th>\n",
       "      <td>科技金融</td>\n",
       "      <td>3.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>旅游</td>\n",
       "      <td>5.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>学校教育</td>\n",
       "      <td>5.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>家政服务</td>\n",
       "      <td>5.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>61</th>\n",
       "      <td>矿产开采</td>\n",
       "      <td>6.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>日化</td>\n",
       "      <td>17.5</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>50</th>\n",
       "      <td>机械/设备</td>\n",
       "      <td>20.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>基金/证券/投资</td>\n",
       "      <td>25.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>其他金融</td>\n",
       "      <td>25.0</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>人力资源服务</td>\n",
       "      <td>31.5</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>78 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "          行业  平均薪资\n",
       "63      科技金融   3.5\n",
       "46        旅游   5.0\n",
       "25      学校教育   5.0\n",
       "28      家政服务   5.5\n",
       "61      矿产开采   6.0\n",
       "..       ...   ...\n",
       "47        日化  17.5\n",
       "50     机械/设备  20.0\n",
       "22  基金/证券/投资  25.0\n",
       "12      其他金融  25.0\n",
       "5     人力资源服务  31.5\n",
       "\n",
       "[78 rows x 2 columns]"
      ]
     },
     "execution_count": 204,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 行业\n",
    "非薪资面议_行业 = df_非薪资面议.groupby('行业').agg({'平均薪资': 'median'}).reset_index().sort_values('平均薪资')\n",
    "非薪资面议_行业"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 205,
   "id": "b1ad6369",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>地区</th>\n",
       "      <th>行业</th>\n",
       "      <th>平均薪资</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>54</th>\n",
       "      <td>广州-南沙区</td>\n",
       "      <td>房地产租赁/中介</td>\n",
       "      <td>1.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>149</th>\n",
       "      <td>广州-番禺区</td>\n",
       "      <td>房地产开发经营</td>\n",
       "      <td>2.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>209</th>\n",
       "      <td>广州-荔湾区</td>\n",
       "      <td>学校教育</td>\n",
       "      <td>2.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>51</th>\n",
       "      <td>广州-南沙区</td>\n",
       "      <td>其他商务服务业</td>\n",
       "      <td>3.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>250</th>\n",
       "      <td>广州-黄埔区</td>\n",
       "      <td>酒店/民宿</td>\n",
       "      <td>4.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>105</th>\n",
       "      <td>广州-海珠区</td>\n",
       "      <td>IT服务</td>\n",
       "      <td>22.75</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>77</th>\n",
       "      <td>广州-天河区</td>\n",
       "      <td>在线社交/媒体</td>\n",
       "      <td>23.20</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>228</th>\n",
       "      <td>广州-越秀区</td>\n",
       "      <td>计算机软件</td>\n",
       "      <td>25.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>140</th>\n",
       "      <td>广州-番禺区</td>\n",
       "      <td>基金/证券/投资</td>\n",
       "      <td>25.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>166</th>\n",
       "      <td>广州-白云区</td>\n",
       "      <td>人力资源服务</td>\n",
       "      <td>31.50</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>207 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "         地区        行业   平均薪资\n",
       "54   广州-南沙区  房地产租赁/中介   1.50\n",
       "149  广州-番禺区   房地产开发经营   2.00\n",
       "209  广州-荔湾区      学校教育   2.50\n",
       "51   广州-南沙区   其他商务服务业   3.50\n",
       "250  广州-黄埔区     酒店/民宿   4.00\n",
       "..      ...       ...    ...\n",
       "105  广州-海珠区      IT服务  22.75\n",
       "77   广州-天河区   在线社交/媒体  23.20\n",
       "228  广州-越秀区     计算机软件  25.00\n",
       "140  广州-番禺区  基金/证券/投资  25.00\n",
       "166  广州-白云区    人力资源服务  31.50\n",
       "\n",
       "[207 rows x 3 columns]"
      ]
     },
     "execution_count": 205,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "非薪资面议_地区_行业 = df_非薪资面议.groupby(['地区','行业']).agg({'平均薪资': 'median'}).reset_index().query('地区!=\"广州\"').sort_values('平均薪资')\n",
    "非薪资面议_地区_行业"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 206,
   "id": "e177b504",
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>学历</th>\n",
       "      <th>行业</th>\n",
       "      <th>平均薪资</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>173</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>广播/影视/录音</td>\n",
       "      <td>2.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>144</th>\n",
       "      <td>本科</td>\n",
       "      <td>科技金融</td>\n",
       "      <td>3.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>175</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>房地产租赁/中介</td>\n",
       "      <td>3.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>78</th>\n",
       "      <td>学历不限</td>\n",
       "      <td>咨询服务</td>\n",
       "      <td>3.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>148</th>\n",
       "      <td>本科</td>\n",
       "      <td>运营商/增值服务</td>\n",
       "      <td>3.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>170</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>基金/证券/投资</td>\n",
       "      <td>25.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>165</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>其他金融</td>\n",
       "      <td>25.00</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>70</th>\n",
       "      <td>大专及以上</td>\n",
       "      <td>电子商务</td>\n",
       "      <td>26.75</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>182</th>\n",
       "      <td>统招本科</td>\n",
       "      <td>货运/物流/仓储</td>\n",
       "      <td>27.50</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>74</th>\n",
       "      <td>学历不限</td>\n",
       "      <td>人力资源服务</td>\n",
       "      <td>31.50</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>186 rows × 3 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "        学历        行业   平均薪资\n",
       "173   统招本科  广播/影视/录音   2.00\n",
       "144     本科      科技金融   3.50\n",
       "175   统招本科  房地产租赁/中介   3.50\n",
       "78    学历不限      咨询服务   3.50\n",
       "148     本科  运营商/增值服务   3.50\n",
       "..     ...       ...    ...\n",
       "170   统招本科  基金/证券/投资  25.00\n",
       "165   统招本科      其他金融  25.00\n",
       "70   大专及以上      电子商务  26.75\n",
       "182   统招本科  货运/物流/仓储  27.50\n",
       "74    学历不限    人力资源服务  31.50\n",
       "\n",
       "[186 rows x 3 columns]"
      ]
     },
     "execution_count": 206,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "非薪资面议_学历_行业 = df_非薪资面议.groupby(['学历','行业']).agg({'平均薪资': 'median'}).reset_index().sort_values('平均薪资')\n",
    "非薪资面议_学历_行业"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 207,
   "id": "9e4299be",
   "metadata": {},
   "outputs": [],
   "source": [
    "# Export: write every aggregated salary table to its own sheet of one workbook.\n",
    "# The file is created relative to the current working directory; index=False\n",
    "# omits the DataFrame index from each sheet.\n",
    "with pd.ExcelWriter(\"新媒体运营_薪资数据.xlsx\") as writer:\n",
    "    非薪资面议_地区.to_excel(writer, sheet_name='地区', index=False)\n",
    "    非薪资面议_学历.to_excel(writer, sheet_name='学历', index=False)\n",
    "    非薪资面议_行业.to_excel(writer, sheet_name='行业', index=False)\n",
    "    非薪资面议_地区_行业.to_excel(writer, sheet_name='地区_行业', index=False)\n",
    "    # This frame is grouped by 学历 and 行业, so the sheet is named to match\n",
    "    # (it was previously mislabelled '学历_地区').\n",
    "    非薪资面议_学历_行业.to_excel(writer, sheet_name='学历_行业', index=False)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "a599ed23",
   "metadata": {},
   "outputs": [],
   "source": []
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "82b81dfc",
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.8"
  },
  "toc": {
   "base_numbering": 1,
   "nav_menu": {},
   "number_sections": true,
   "sideBar": true,
   "skip_h1_title": false,
   "title_cell": "Table of Contents",
   "title_sidebar": "Contents",
   "toc_cell": false,
   "toc_position": {},
   "toc_section_display": true,
   "toc_window_display": false
  }
 },
 "nbformat": 4,
 "nbformat_minor": 5
}
